	.set noreorder
	.set noat
	.arch sw3
	#  /usr/sz/swcc/lib/gcc-lib/alpha-swcc-linux/3.1.0-483/be::3.1.0-483

	#-----------------------------------------------------------
	# Compiling 3d7p_reuse_v1_unhide.c (/tmp/ccI.QVNjIf)
	#-----------------------------------------------------------

	#-----------------------------------------------------------
	# Options:
	#-----------------------------------------------------------
	#  Target:SW3, ISA:ISA_1, Pointer Size:64
	#  -O3	(Optimization level)
	#  -g0	(Debug level)
	#  -m1	(Report warnings)
	#-----------------------------------------------------------


	.section .bss, "wa", "nobits"
	.align	3

	.section .tdata, "wa", "progbits"
	.align	0

	.section .tdata_local, "wa", "progbits"
	.align	4

	.section .tdata_local_fix, "wa", "progbits"
	.align	4

	.section .text1, "ax", "progbits"
	.align	4

	# global_pad_0_74: 17203-byte object reserved at offset 0 of .bss (declared
	# "nobits" above, so it occupies no file space). No .globl is emitted for it,
	# and nothing in the visible part of this file references the symbol.
	# NOTE(review): the name suggests compiler-generated padding -- confirm.
	.section .bss
	.org 0x0
	.align	0
	.type	global_pad_0_74, @object
	.size	global_pad_0_74, 17203
global_pad_0_74:	# 0x0
	.skip 17203
	.section .text1

	# Program Unit: rtc_
	#
	# unsigned long rtc_()   (C source lines 53-57, echoed in the comments below)
	#
	# Purpose: execute the single inline-asm instruction `rcsr $0,4` and hand the
	#          value it leaves in $0 back to the caller.
	# In:      $26 = return address (the function returns through it).
	#          $27 = base used by the gp setup at the global entry only;
	#                presumably this function's own address -- TODO confirm.
	# Out:     $0  = value read by rcsr.
	# Stack:   16 bytes are allocated and released again; nothing is stored in
	#          them inside this function.
	# Entries: rtc_       global entry, recomputes $gp first.
	#          $ng..rtc_  entry after the gp setup; same-file callers branch here
	#                     directly (stencil_core uses `bsr $26,$ng..rtc_`).
	# NOTE(review): what control/status register 4 holds is not visible here;
	#          presumably a time or cycle counter given the name -- confirm
	#          against the SW3 ISA documentation.
	.align 4
	.ent	rtc_#
	.globl	rtc_
rtc_:	# 0x0
	# return_address = 0
#Block: 1 Pred: Succ: 2 
	.file	1 "/mnt/export/base/caoj1/mysvn/SW_DAG/src/examples/3d7p-2d/3d7p-ldm-manager-version/3d7p_2d/3d7p_reuse_v1_unhide.c"
	.loc	1	54	0
#  50  extern unsigned long slave_dma_count[64];
#  51  extern unsigned long slave_comp_count[64];
#  52  extern unsigned long slave_comp_dma_count[64];
#  53  unsigned long rtc_()
#  54  {
.L_BB1_rtc_:	# 0x0
#<freq>
#<freq> BB:1 frequency = 1.00000 (heuristic)
#<freq>
	# Global entry only: the two instructions share the !gpdisp!1 annotation and
	# together derive $gp from $27. $gp is not used again inside rtc_.
	ldih	$gp,0($27)               	!gpdisp!1	# [0]  0
	ldi	$gp,0($gp)                	!gpdisp!1	# [1]  0
	
$ng..rtc_:
	# Local entry: callers that branch here skip the gp setup above.
	# Open a 16-byte frame (left unused), then perform the register read that is
	# the whole body of the C function: asm volatile("rcsr  %0,4":"=r"(rpcc)).
	ldi	$sp,-16($sp)              	# [2]  
	rcsr  $0,4
#Block: 2 Pred: 1 Succ: 
.L_BB2_rtc_:	# 0x24
#<freq>
#<freq> BB:2 frequency = 1.00000 (heuristic)
#<freq>
	.loc	1	57	0
#  55    unsigned long rpcc;
#  56    asm volatile("rcsr  %0,4":"=r"(rpcc));
#  57    return rpcc;
	# Epilogue: drop the 16-byte frame and return through $26; $0 still holds
	# the value produced by rcsr.
	ldi	$sp,16($sp)               	# [0]  
	ret	$31,($26),1               	# [0]  
.L_CC_rtc_:
#PU cycle count: 4.000000
	.end	rtc_

	# ---------------------------------------------------------------------
	# .tdata_local: exported scalar variables, one per 8-byte slot
	# (offsets 0x00 .. 0x70). Placement is fixed by the explicit .org
	# directives, so inserting or resizing an entry requires renumbering every
	# later .org. Except for core_id (4 bytes, initialised to 0) every entry
	# is an 8-byte .skip.
	# In stencil_core these symbols are addressed with `ldi rX,sym($31)` plus a
	# !tprello annotation.
	# NOTE(review): presumably this section is per-thread local storage on the
	# Sunway slave cores -- confirm against the toolchain documentation.
	# Variables without a usage note below are not referenced in the visible
	# part of this file.
	# ---------------------------------------------------------------------
	.section .tdata_local
	# get_reply: cleared by stencil_core (C line 111, `get_reply=0;`), named as
	# the reply argument of athread_get in the echoed C source, and later polled
	# in a loop against a count kept in a spill slot.
	.org 0x0
	.align	0
	.globl	get_reply
	.type	get_reply, @object
	.size	get_reply, 8
get_reply:	# 0x0
	.skip 8
	# end of initialization for get_reply
	# get_reply1: cleared at C line 126 and passed in $20 to the athread_get
	# calls that fill A_fs and A_bs.
	.org 0x8
	.align	0
	.globl	get_reply1
	.type	get_reply1, @object
	.size	get_reply1, 8
get_reply1:	# 0x8
	.skip 8
	# end of initialization for get_reply1
	# get_reply2: cleared at C line 144, passed in $20 to the four athread_get
	# calls that fill A_us, A_ds, A_ls and A_rs, then polled until it equals 4.
	.org 0x10
	.align	0
	.globl	get_reply2
	.type	get_reply2, @object
	.size	get_reply2, 8
get_reply2:	# 0x10
	.skip 8
	# end of initialization for get_reply2
	.org 0x18
	.align	0
	.globl	put_reply
	.type	put_reply, @object
	.size	put_reply, 8
put_reply:	# 0x18
	.skip 8
	# end of initialization for put_reply
	# core_id: 4-byte word initialised to 0; stencil_core stores the return value
	# of athread_get_id(-1) here (C line 76). The next .org (0x28) leaves the
	# remaining 4 bytes of this slot as padding.
	.org 0x20
	.align	0
	.globl	core_id
	.type	core_id, @object
	.size	core_id, 4
core_id:	# 0x20
	# offset 32
	.long	0
	# end of initialization for core_id
	# start: receives the value returned by rtc_() at C line 77.
	.org 0x28
	.align	0
	.globl	start
	.type	start, @object
	.size	start, 8
start:	# 0x28
	.skip 8
	# end of initialization for start
	.org 0x30
	.align	0
	.globl	end
	.type	end, @object
	.size	end, 8
end:	# 0x30
	.skip 8
	# end of initialization for end
	.org 0x38
	.align	0
	.globl	dma_start
	.type	dma_start, @object
	.size	dma_start, 8
dma_start:	# 0x38
	.skip 8
	# end of initialization for dma_start
	.org 0x40
	.align	0
	.globl	dma_end
	.type	dma_end, @object
	.size	dma_end, 8
dma_end:	# 0x40
	.skip 8
	# end of initialization for dma_end
	.org 0x48
	.align	0
	.globl	comp_st
	.type	comp_st, @object
	.size	comp_st, 8
comp_st:	# 0x48
	.skip 8
	# end of initialization for comp_st
	.org 0x50
	.align	0
	.globl	comp_et
	.type	comp_et, @object
	.size	comp_et, 8
comp_et:	# 0x50
	.skip 8
	# end of initialization for comp_et
	.org 0x58
	.align	0
	.globl	dma_et
	.type	dma_et, @object
	.size	dma_et, 8
dma_et:	# 0x58
	.skip 8
	# end of initialization for dma_et
	# dma_st: receives the value returned by rtc_() at C line 108.
	.org 0x60
	.align	0
	.globl	dma_st
	.type	dma_st, @object
	.size	dma_st, 8
dma_st:	# 0x60
	.skip 8
	# end of initialization for dma_st
	.org 0x68
	.align	0
	.globl	dma_et_
	.type	dma_et_, @object
	.size	dma_et_, 8
dma_et_:	# 0x68
	.skip 8
	# end of initialization for dma_et_
	.org 0x70
	.align	0
	.globl	dma_st_
	.type	dma_st_, @object
	.size	dma_st_, 8
dma_st_:	# 0x70
	.skip 8
	# end of initialization for dma_st_

	# ---------------------------------------------------------------------
	# .tdata_local_fix: exported buffers packed back to back by explicit .org
	# directives; each .org equals the previous offset plus the previous .size,
	# so resizing one buffer requires renumbering every later .org.
	#
	#   symbol    offset   bytes
	#   slave     0x0000   15680
	#   A_us      0x3d40    1120
	#   A_ds      0x41a0    1120
	#   A_ls      0x4600    1120
	#   A_rs      0x4a60    1120
	#   A_fs      0x4ec0     392
	#   A_bs      0x5048     392
	#   amt_flag  0x51d0       4   (initialised to 0)
	#
	# In stencil_core these symbols are addressed with `ldi rX,sym($31)` plus a
	# !tprello annotation, and the buffers are passed in $18 to athread_get.
	# NOTE(review): presumably these live in the slave core's local memory --
	# confirm against the toolchain documentation.
	# ---------------------------------------------------------------------
	.section .tdata_local_fix
	# slave: the echoed C source passes &slave[rhs_no][i-s_starti][0][0] as the
	# athread_get destination (C lines 119-122); stencil_core adds a multiple of
	# rhs_no to this base address.
	.org 0x0
	.align	0
	.globl	slave
	.type	slave, @object
	.size	slave, 15680
slave:	# 0x0
	.skip 15680
	# end of initialization for slave
	# A_us / A_ds / A_ls / A_rs: each is the destination of one athread_get call
	# issued with $19 = 1120, i.e. the whole buffer (C lines 149-168).
	.org 0x3d40
	.align	0
	.globl	A_us
	.type	A_us, @object
	.size	A_us, 1120
A_us:	# 0x3d40
	.skip 1120
	# end of initialization for A_us
	.org 0x41a0
	.align	0
	.globl	A_ds
	.type	A_ds, @object
	.size	A_ds, 1120
A_ds:	# 0x41a0
	.skip 1120
	# end of initialization for A_ds
	.org 0x4600
	.align	0
	.globl	A_ls
	.type	A_ls, @object
	.size	A_ls, 1120
A_ls:	# 0x4600
	.skip 1120
	# end of initialization for A_ls
	.org 0x4a60
	.align	0
	.globl	A_rs
	.type	A_rs, @object
	.size	A_rs, 1120
A_rs:	# 0x4a60
	.skip 1120
	# end of initialization for A_rs
	# A_fs / A_bs: filled inside the loop at .Lt_1_132, one athread_get per
	# iteration with $19 = 56; the destination pointer advances by 56 bytes per
	# iteration, so 392 bytes hold seven such pieces.
	.org 0x4ec0
	.align	0
	.globl	A_fs
	.type	A_fs, @object
	.size	A_fs, 392
A_fs:	# 0x4ec0
	.skip 392
	# end of initialization for A_fs
	.org 0x5048
	.align	0
	.globl	A_bs
	.type	A_bs, @object
	.size	A_bs, 392
A_bs:	# 0x5048
	.skip 392
	# end of initialization for A_bs
	# amt_flag: 4-byte word initialised to 0; stencil_core loads it right after
	# reading its arguments and branches to .L_BB4_stencil_core when it is zero.
	.org 0x51d0
	.align	0
	.globl	amt_flag
	.type	amt_flag, @object
	.size	amt_flag, 4
amt_flag:	# 0x51d0
	# offset 20944
	.long	0
	# end of initialization for amt_flag

	.section .rodata, "a", "progbits"
	.align	3
	.section .text1
	.align 4

	# Program Unit: stencil_core
	.align 4
	.ent	stencil_core#
	.globl	stencil_core
stencil_core:	# 0x20
	# tileno = 32
	# varno = 44
	# reuse = 52
	# return_address = 16
	# gra_spill_temp_0 = 64
	# gra_spill_temp_1 = 72
	# gra_spill_temp_2 = 80
	# gra_spill_temp_3 = 88
	# gra_spill_temp_4 = 96
	# gra_spill_temp_5 = 104
	# gra_spill_temp_6 = 112
	# gra_spill_temp_7 = 120
	# gra_spill_temp_8 = 128
	# gra_spill_temp_9 = 136
	# gra_spill_temp_10 = 144
	# gra_spill_temp_11 = 152
	# gra_spill_temp_12 = 160
	# gra_spill_temp_13 = 168
	# gra_spill_temp_14 = 176
	# gra_spill_temp_15 = 184
	# gra_spill_temp_16 = 192
	# gra_spill_temp_17 = 200
	# gra_spill_temp_18 = 208
	# gra_spill_temp_19 = 216
	# gra_spill_temp_20 = 224
	# gra_spill_temp_21 = 232
	# gra_spill_temp_22 = 240
	# gra_spill_temp_23 = 248
	# gra_spill_temp_24 = 256
	# gra_spill_temp_25 = 264
	# gra_spill_temp_26 = 272
	# gra_spill_temp_27 = 280
	# gra_spill_temp_28 = 288
	# gra_spill_temp_29 = 296
	# gra_spill_temp_30 = 304
	# gra_spill_temp_31 = 312
	# gra_spill_temp_32 = 320
	# gra_spill_temp_33 = 328
	# gra_spill_temp_34 = 336
	# gra_spill_temp_35 = 344
	# gra_spill_temp_36 = 352
	# gra_spill_temp_37 = 360
	# gra_spill_temp_38 = 368
	# gra_spill_temp_39 = 376
	# gra_spill_temp_40 = 384
	# gra_spill_temp_41 = 392
	# gra_spill_temp_42 = 400
	# gra_spill_temp_43 = 408
	# gra_spill_temp_44 = 416
	# gra_spill_temp_45 = 424
	# gra_spill_temp_46 = 432
	# gra_spill_temp_47 = 440
	# gra_spill_temp_48 = 448
	# gra_spill_temp_49 = 456
	# gra_spill_temp_50 = 464
	# gra_spill_temp_51 = 472
	# gra_spill_temp_52 = 480
	# gra_spill_temp_53 = 488
	# gra_spill_temp_54 = 496
	# gra_spill_temp_55 = 504
	# gra_spill_temp_56 = 512
	# gra_spill_temp_57 = 520
	# gra_spill_temp_58 = 528
	# gra_spill_temp_59 = 536
	# gra_spill_temp_60 = 544
	# gra_spill_temp_61 = 552
	# gra_spill_temp_62 = 560
	# gra_spill_temp_63 = 568
	# gra_spill_temp_64 = 576
	# gra_spill_temp_65 = 584
	# gra_spill_temp_66 = 592
	# gra_spill_temp_67 = 600
	# gra_spill_temp_68 = 608
	# gra_spill_temp_69 = 616
	# gra_spill_temp_70 = 624
	# gra_spill_temp_71 = 632
	# gra_spill_temp_72 = 640
	# gra_spill_temp_73 = 648
	# gra_spill_temp_74 = 656
	# gra_spill_temp_75 = 664
	# gra_spill_temp_76 = 672
	# gra_spill_temp_77 = 680
	# gra_spill_temp_78 = 688
	# gra_spill_temp_79 = 696
	# gra_spill_temp_80 = 704
	# gra_spill_temp_81 = 712
	# gra_spill_temp_82 = 720
	# gra_spill_temp_83 = 728
	# gra_spill_temp_84 = 736
	# gra_spill_temp_85 = 744
	# gra_spill_temp_86 = 752
	# gra_spill_temp_87 = 760
	# gra_spill_temp_88 = 768
	# gra_spill_temp_89 = 776
	# gra_spill_temp_90 = 784
	# gra_spill_temp_91 = 792
	# gra_spill_temp_92 = 800
	# gra_spill_temp_93 = 808
	# lgra_spill_temp_94 = 816
#Block: 1 Pred: Succ: 2 
	.loc	1	62	0
#  58  }
#  59  #endif
#  60  
#  61  void stencil_core(targs* args)
#  62  {  
.L_BB1_stencil_core:	# 0x20
#<freq>
#<freq> BB:1 frequency = 1.00000 (heuristic)
#<freq>
	ldih	$gp,0($27)               	!gpdisp!2	# [0]  0
	ldi	$gp,0($gp)                	!gpdisp!2	# [1]  0
	
$ng..stencil_core:
	ldi	$sp,-832($sp)             	# [2]  
	stl	$16,392($sp)              	# [3]  gra_spill_temp_41
	.loc	1	76	0
#  72    int reuse[2];
#  73    int lhs_no,rhs_no;
#  74    int core_dma_num = 0;
#  75  #ifdef _PROFILING
#  76    core_id = athread_get_id(-1);
	ldi	$16,-1($31)               	# [3]  
	.frame $30,832,$26,0
	.mask 0x4000000,-816
	stl	$11,776($sp)              	# [4]  gra_spill_temp_89
	.loc	1	62	0
	stl	$26,16($sp)               	# [5]  return_address
	.loc	1	76	0
	.prologue
	.globl	athread_get_id
	bsr	$26,athread_get_id        	# [6]  athread_get_id
#Block: 2 Pred: 1 Succ: 3 
.L_BB2_stencil_core:	# 0x4c
#<freq>
#<freq> BB:2 frequency = 1.00000 (heuristic)
#<freq>
#	.spillsp $11, 0
	ldi	$11,core_id($31)          	!tprello	# [0]  core_id
	stl	$9,768($sp)               	# [0]  gra_spill_temp_88
	stw	$0,0($11)                 	# [1]  id:1363 core_id+0x0
	stl	$14,784($sp)              	# [2]  gra_spill_temp_90
	.loc	1	77	0
#  77    start=rtc_();
#	.spillsp $9, 0
	bsr	$26,$ng..rtc_             	# [3]  rtc_
#Block: 3 Pred: 2 Succ: 4 6 
.L_BB3_stencil_core:	# 0x60
#<freq>
#<freq> BB:3 frequency = 1.00000 (heuristic)
#<freq> BB:3 => BB:4 probability = 0.04211
#<freq> BB:3 => BB:6 probability = 0.95789
#<freq>
	.loc	1	79	0
#  78  #endif
#  79    s_iter = args->iter;
	ldl	$2,392($sp)               	# [0]  gra_spill_temp_41
	.loc	1	77	0
#	.spillsp $14, 0
	ldi	$14,start($31)            	!tprello	# [0]  start
	stl	$0,0($14)                 	# [1]  id:1364 start+0x0
	ldi	$1,amt_flag($31)          	!tprello	# [1]  amt_flag
	stl	$1,64($sp)                	# [2]  gra_spill_temp_0
	.loc	1	87	0
#  83    s_endi = args->endi;
#  84    s_startj = args->startj;
#  85    s_endj = args->endj;
#  86    s_startk = 1;
#  87    s_endk = args->k_N-1;
	ldw	$1,0($1)                  	# [3]  id:1371 amt_flag+0x0
	.loc	1	79	0
	ldw	$9,20($2)                 	# [4]  id:1365
	.loc	1	82	0
	ldw	$6,0($2)                  	# [5]  id:1366
	.loc	1	84	0
	ldw	$5,8($2)                  	# [6]  id:1368
	.loc	1	83	0
	ldw	$4,4($2)                  	# [7]  id:1367
	.loc	1	85	0
	ldw	$3,12($2)                 	# [8]  id:1369
	.loc	1	87	0
	ldw	$2,16($2)                 	# [9]  id:1370
	.loc	1	84	0
	stl	$5,464($sp)               	# [10]  gra_spill_temp_50
	.loc	1	87	0
	subw	$2,1,$2                  	# [13]  
	stl	$2,664($sp)               	# [14]  gra_spill_temp_75
	.loc	1	85	0
	stl	$3,288($sp)               	# [15]  gra_spill_temp_28
	.loc	1	83	0
	stl	$4,256($sp)               	# [16]  gra_spill_temp_24
	.loc	1	82	0
	stl	$6,520($sp)               	# [17]  gra_spill_temp_57
	stl	$10,232($sp)              	# [18]  gra_spill_temp_21
	stl	$11,240($sp)              	# [19]  gra_spill_temp_22
	stl	$12,248($sp)              	# [20]  gra_spill_temp_23
	.loc	1	87	0
#	.spillsp $10, 0
#<bpre> branch predict not taken
	beq	$1,.L_BB4_stencil_core    	# [21]  
#Block: 6 Pred: 5 3 Succ: 7 
.Lt_1_116:	# 0xb8
#<freq>
#<freq> BB:6 frequency = 1.00000 (heuristic)
#<freq>
	.loc	1	102	0
#  98    }
#  99    tileno[0]=s_starti/BLKX;
# 100    tileno[1]=s_startj/BLKY;
# 101    tileno[2]=s_startk/BLKZ;
# 102    slave_ldm_postreq_tile(s_iter, &A[dest][0][0][0], tileno, OUT);//
	subw	$31,$9,$21               	# [0]  
	.loc	1	99	0
#	.spillsp $12, 0
	ldl	$8,520($sp)               	# [0]  gra_spill_temp_57
	.loc	1	102	0
	selge	$9,$9,$21,$21           	# [1]  
	.loc	1	100	0
	ldl	$7,464($sp)               	# [1]  gra_spill_temp_50
	.loc	1	102	0
	and	$21,1,$21                 	# [2]  
	ldi	$10,560($31)              	# [2]  
	subw	$31,$21,$23              	# [3]  
	ldih	$10,786($10)             	# [3]  
	selge	$9,$21,$23,$21          	# [4]  
	.loc	1	99	0
	ldi	$23,9363($31)             	# [4]  
	.loc	1	102	0
	sra	$21,32,$24                	# [5]  
	sra	$10,32,$17                	# [5]  
	.loc	1	100	0
	subw	$31,$7,$22               	# [6]  
	.loc	1	99	0
	subw	$31,$8,$20               	# [6]  
	selge	$8,$8,$20,$20           	# [7]  
	ldih	$23,-28087($23)          	# [7]  
	.loc	1	100	0
	selge	$7,$7,$22,$22           	# [8]  
	.loc	1	102	0
	mov	$21,$12                   	# [8]  
	mulw	$21,$17,$17              	# [9]  
	.loc	1	97	0
	.globl	A
	ldl	$11,A($gp)                	!literal	# [9]  A
	.loc	1	102	0
	mulw	$10,$24,$24              	# [10]  
	.loc	1	101	0
	stw	$31,40($sp)               	# [10]  tileno+8
	.loc	1	100	0
	umulw	$22,$23,$22             	# [11]  
	.loc	1	102	0
	mov	2,$19                     	# [11]  
	.loc	1	99	0
	umulw	$20,$23,$20             	# [12]  
	.loc	1	102	0
	mov	$9,$16                    	# [12]  
	umulw	$21,$10,$21             	# [13]  
	ldi	$18,32($sp)               	# [13]  tileno
	addl	$17,$24,$17              	# [15]  
	.loc	1	100	0
	srl	$22,34,$22                	# [16]  
	.loc	1	102	0
	sll	$17,32,$17                	# [17]  
	.loc	1	99	0
	srl	$20,34,$20                	# [17]  
	.loc	1	102	0
	addl	$17,$21,$17              	# [18]  
	.loc	1	99	0
	subw	$31,$20,$21              	# [18]  
	.loc	1	100	0
	subw	$31,$22,$23              	# [19]  
	.loc	1	99	0
	selge	$8,$20,$21,$8           	# [19]  
	.loc	1	100	0
	selge	$7,$22,$23,$7           	# [20]  
	.loc	1	99	0
	stw	$8,32($sp)                	# [20]  tileno
	.loc	1	100	0
	stw	$7,36($sp)                	# [21]  tileno+4
	.loc	1	102	0
	stl	$17,304($sp)              	# [22]  gra_spill_temp_30
	addl	$17,$11,$17              	# [22]  
	.globl	slave_ldm_postreq_tile
	bsr	$26,slave_ldm_postreq_tile 	# [23]  slave_ldm_postreq_tile
#Block: 7 Pred: 6 Succ: 8 
.L_BB7_stencil_core:	# 0x160
#<freq>
#<freq> BB:7 frequency = 1.00000 (heuristic)
#<freq>
	.loc	1	103	0
# 103    slave_ldm_postreq_tile(s_iter, &A[src][0][0][0], tileno, IN);
	ldi	$20,-560($31)             	# [0]  
	sra	$12,32,$21                	# [0]  
	ldih	$20,-786($20)            	# [1]  
	mov	1,$19                     	# [1]  
	sra	$20,32,$17                	# [2]  
	mulw	$20,$21,$21              	# [2]  
	mulw	$12,$17,$17              	# [3]  
	mov	$9,$16                    	# [3]  
	umulw	$12,$20,$20             	# [4]  
	ldi	$18,32($sp)               	# [4]  tileno
	addl	$17,$21,$17              	# [8]  
	sll	$17,32,$17                	# [9]  
	addl	$17,$20,$17              	# [10]  
	stl	$17,456($sp)              	# [11]  gra_spill_temp_49
	addl	$17,$11,$17              	# [11]  
	addl	$17,$10,$17              	# [12]  
	.globl	slave_ldm_postreq_tile
	bsr	$26,slave_ldm_postreq_tile 	# [12]  slave_ldm_postreq_tile
#Block: 8 Pred: 7 Succ: 9 
.L_BB8_stencil_core:	# 0x1a4
#<freq>
#<freq> BB:8 frequency = 1.00000 (heuristic)
#<freq>
	stl	$13,760($sp)              	# [0]  gra_spill_temp_87
	.loc	1	104	0
# 104    slave_ldm_getrep(2,varno,reuse);
	ldi	$17,44($sp)               	# [0]  varno
	mov	2,$16                     	# [1]  
#	.spillsp $13, 0
	ldi	$18,52($sp)               	# [1]  reuse
	.globl	slave_ldm_getrep
	bsr	$26,slave_ldm_getrep      	# [2]  slave_ldm_getrep
#Block: 9 Pred: 8 Succ: 10 
.L_BB9_stencil_core:	# 0x1b8
#<freq>
#<freq> BB:9 frequency = 1.00000 (heuristic)
#<freq>
	.loc	1	106	0
# 105    lhs_no = varno[0];
# 106    rhs_no = varno[1];
	ldw	$13,48($sp)               	# [64]  varno+4
	.loc	1	105	0
	ldw	$9,44($sp)                	# [65]  varno
	.loc	1	108	0
# 107  #ifdef _PROFILING
# 108    dma_st=rtc_();
	bsr	$26,$ng..rtc_             	# [66]  rtc_
#Block: 10 Pred: 9 Succ: 11 13 
.L_BB10_stencil_core:	# 0x1c4
#<freq>
#<freq> BB:10 frequency = 1.00000 (heuristic)
#<freq> BB:10 => BB:11 probability = 0.05098
#<freq> BB:10 => BB:13 probability = 0.94902
#<freq>
	ldi	$21,dma_st($31)           	!tprello	# [0]  dma_st
	ldi	$12,get_reply($31)        	!tprello	# [0]  get_reply
	stl	$0,0($21)                 	# [1]  id:1377 dma_st+0x0
	.loc	1	111	0
# 109  #endif
# 110    //1 update core data
# 111    get_reply=0;
	stl	$31,0($12)                	# [2]  id:1378 get_reply+0x0
	.loc	1	108	0
	stl	$21,416($sp)              	# [3]  gra_spill_temp_44
	stl	$9,272($sp)               	# [4]  gra_spill_temp_26
	.loc	1	111	0
#<bpre> branch predict not taken
	blt	$13,.L_BB11_stencil_core  	# [5]  
#Block: 13 Pred: 10 Succ: 14 22 
.Lt_1_119:	# 0x1e0
#<freq>
#<freq> BB:13 frequency = 0.94902 (heuristic)
#<freq> BB:13 => BB:14 probability = 0.16000
#<freq> BB:13 => BB:22 probability = 0.84000
#<freq>
	.loc	1	113	0
# 112    if(rhs_no <0)
# 113      printf("Array assignment failed\n");
	ldl	$23,520($sp)              	# [0]  gra_spill_temp_57
	ldl	$24,256($sp)              	# [1]  gra_spill_temp_24
	ldw	$22,56($sp)               	# [2]  reuse+4
	cmplt	$23,$24,$23             	# [5]  
	stl	$23,448($sp)              	# [6]  gra_spill_temp_48
	stl	$14,280($sp)              	# [7]  gra_spill_temp_27
#<bpre> branch predict not taken
	beq	$22,.L_BB14_stencil_core  	# [9]  
#Block: 22 Pred: 13 Succ: 23 
.Lt_1_121:	# 0x1fc
#<freq>
#<freq> BB:22 frequency = 0.79717 (heuristic)
#<freq>
	.loc	1	123	0
# 119         athread_get(PE_MODE,&A[src][i][s_startj][s_startk]
# 120                   , &slave[rhs_no][i-s_starti][0][0]
# 121                   , len, &get_reply
# 122                   , 0, stride, bsize);
# 123      core_dma_num+=(s_endi-s_starti);
	ldl	$17,464($sp)              	# [0]  gra_spill_temp_50
	sll	$13,5,$20                 	# [0]  
	s8subl	$20,$20,$20            	# [1]  
	ldl	$16,520($sp)              	# [1]  gra_spill_temp_57
	ldl	$14,256($sp)              	# [2]  gra_spill_temp_24
	s8subl	$20,$20,$20            	# [2]  
	s4addl	$20,$20,$20            	# [3]  
	ldi	$19,slave($31)            	!tprello	# [3]  slave
	sll	$17,4,$17                 	# [4]  
	stl	$19,712($sp)              	# [4]  gra_spill_temp_81
	s8subl	$17,$17,$18            	# [5]  
	addl	$19,$20,$19              	# [5]  
	s4addl	$17,$18,$17            	# [6]  
	stl	$19,424($sp)              	# [6]  gra_spill_temp_45
	stl	$17,216($sp)              	# [7]  gra_spill_temp_19
	subw	$14,$16,$14              	# [7]  
	stl	$15,264($sp)              	# [8]  gra_spill_temp_25
	mov	$31,$5                    	# [8]  
#Block: 23 Pred: 12 22 193 20 Succ: 24 30 
.Lt_1_120:	# 0x244
.Lt_1_118:	# 0x244
#<freq>
#<freq> BB:23 frequency = 1.00000 (heuristic)
#<freq> BB:23 => BB:24 probability = 0.78423
#<freq> BB:23 => BB:30 probability = 0.21577
#<freq>
	.loc	1	126	0
# 124   }
# 125    //2 update front and back shade data
# 126    get_reply1 = 0;
	ldl	$18,448($sp)              	# [0]  gra_spill_temp_48
	.loc	1	123	0
#	.spillsp $15, 0
	ldi	$15,get_reply1($31)       	!tprello	# [0]  get_reply1
	.loc	1	126	0
	stl	$31,0($15)                	# [1]  id:1380 get_reply1+0x0
#<bpre> branch predict not taken
	beq	$18,.Lt_1_129             	# [4]  
#Block: 24 Pred: 23 Succ: 202 
.L_BB24_stencil_core:	# 0x254
#<freq>
#<freq> BB:24 frequency = 0.78423 (heuristic)
#<freq>
	stl	$13,112($sp)              	# [0]  gra_spill_temp_6
	ldi	$9,29680($31)             	# [0]  
	ldl	$13,520($sp)              	# [1]  gra_spill_temp_57
	ldih	$9,1($9)                 	# [1]  
	ldl	$11,456($sp)              	# [2]  gra_spill_temp_49
	sll	$13,4,$16                 	# [5]  
	s4subl	$16,$16,$17            	# [6]  
	stl	$12,808($sp)              	# [6]  gra_spill_temp_93
	s4addl	$16,$16,$12            	# [7]  
	subl	$31,$16,$16              	# [7]  
	s4addl	$12,$17,$12            	# [8]  
	sll	$13,8,$13                 	# [8]  
	ldl	$10,216($sp)              	# [9]  gra_spill_temp_19
	s4addl	$13,$16,$13            	# [9]  
	sll	$12,8,$12                 	# [10]  
	ldl	$4,664($sp)               	# [10]  gra_spill_temp_75
	addl	$12,$13,$12              	# [11]  
	ldl	$16,A($gp)                	!literal	# [11]  A
	addl	$11,$12,$11              	# [12]  
	ldi	$12,A_bs($31)             	!tprello	# [12]  A_bs
	addl	$10,$11,$10              	# [13]  
	ldi	$13,A_fs($31)             	!tprello	# [13]  A_fs
	s8addl	$4,$10,$11             	# [14]  
	s8addl	$4,$31,$4              	# [14]  
	addl	$11,$16,$11              	# [15]  
	addl	$10,$16,$10              	# [15]  
	ldi	$16,560($31)              	# [16]  
	stl	$13,536($sp)              	# [16]  gra_spill_temp_59
	ldih	$16,786($16)             	# [17]  
	stl	$12,528($sp)              	# [17]  gra_spill_temp_58
	addl	$10,$16,$10              	# [18]  
	addl	$11,$16,$11              	# [18]  
	stl	$31,728($sp)              	# [19]  gra_spill_temp_83
#Block: 202 Pred: 24 Succ: 26 
.L_BB202_stencil_core:	# 0x2d8
#<freq>
#<freq> BB:202 frequency = 0.78423 (heuristic)
#<freq>
	stl	$4,144($sp)               	# [0]  gra_spill_temp_10
	stl	$5,752($sp)               	# [1]  gra_spill_temp_86
#Block: 26 Pred: 28 202 Succ: 27 
	.align	4
.Lt_1_132:	# 0x2e0
#<loop> Loop body line 126, nesting depth: 1, estimated iterations: 100
#<freq>
#<freq> BB:26 frequency = 78.42324 (heuristic)
#<freq>
	.loc	1	135	0
# 131    {
# 132       athread_get(PE_MODE,&A[src][i][s_startj][s_startk-1]
# 133                     , &A_fs[i-s_starti][0]
# 134                     , len,&get_reply1
# 135                     , 0, stride, bsize);
	mov	8,$16                     	# [0]  
	mov	168,$17                   	# [0]  
	stl	$17,0($sp)                	# [1]  id:1813
	mov	$31,$21                   	# [1]  
	stl	$16,8($sp)                	# [2]  id:1814
	mov	$15,$20                   	# [2]  
	mov	56,$19                    	# [3]  
	mov	$13,$18                   	# [3]  
	mov	$10,$17                   	# [4]  
	mov	$31,$16                   	# [4]  
	.globl	athread_get
	bsr	$26,athread_get           	# [5]  athread_get
#Block: 27 Pred: 26 Succ: 28 
.L_BB27_stencil_core:	# 0x30c
#<loop> Part of loop body line 126, head labeled .Lt_1_132
#<freq>
#<freq> BB:27 frequency = 78.42324 (heuristic)
#<freq>
	.loc	1	139	0
# 136       athread_get(PE_MODE,&A[src][i][s_startj][s_endk]
# 137                     , &A_bs[i-s_starti][0]
# 138                     , len,&get_reply1
# 139                     , 0, stride, bsize); 
	mov	8,$18                     	# [5]  
	mov	168,$19                   	# [5]  
	stl	$19,0($sp)                	# [6]  id:1815
	mov	$31,$21                   	# [6]  
	stl	$18,8($sp)                	# [7]  id:1816
	mov	$15,$20                   	# [7]  
	mov	56,$19                    	# [8]  
	mov	$12,$18                   	# [8]  
	mov	$11,$17                   	# [9]  
	mov	$31,$16                   	# [9]  
	.globl	athread_get
	bsr	$26,athread_get           	# [10]  athread_get
#Block: 28 Pred: 27 Succ: 26 203 
.L_BB28_stencil_core:	# 0x338
#<loop> Part of loop body line 126, head labeled .Lt_1_132
#<freq>
#<freq> BB:28 frequency = 78.42324 (heuristic)
#<freq> BB:28 => BB:26 probability = 0.99000
#<freq> BB:28 => BB:203 probability = 0.01000
#<freq>
	ldl	$20,728($sp)              	# [0]  gra_spill_temp_83
	ldi	$12,56($12)               	# [0]  
	ldi	$13,56($13)               	# [1]  
	addl	$11,$9,$11               	# [1]  
	addl	$10,$9,$10               	# [2]  
	addw	$20,1,$20                	# [4]  
	stl	$20,728($sp)              	# [5]  gra_spill_temp_83
	cmpeq	$20,$14,$20             	# [5]  
#<bpre> branch predict taken
	beq	$20,.Lt_1_132             	# [6]  
#Block: 203 Pred: 28 Succ: 194 
.L_BB203_stencil_core:	# 0x35c
#<freq>
#<freq> BB:203 frequency = 0.78423 (heuristic)
#<freq>
#Block: 194 Pred: 203 Succ: 31 
.L_BB194_stencil_core:	# 0x35c
#<freq>
#<freq> BB:194 frequency = 0.78423 (heuristic)
#<freq>
	ldl	$13,112($sp)              	# [0]  gra_spill_temp_6
	ldl	$11,A($gp)                	!literal	# [1]  A
	ldl	$12,808($sp)              	# [2]  gra_spill_temp_93
#Block: 31 Pred: 30 194 Succ: 204 33 
.Lt_1_128:	# 0x368
#<freq>
#<freq> BB:31 frequency = 1.00000 (heuristic)
#<freq> BB:31 => BB:204 probability = 0.75000
#<freq> BB:31 => BB:33 probability = 0.25000
#<freq>
	ldl	$4,752($sp)               	# [0]  gra_spill_temp_86
	ldl	$21,0($12)                	# [1]  id:1378 get_reply+0x0
	cmpeq	$4,$21,$21              	# [5]  
#<bpre> branch predict not taken
	bne	$21,.Lt_1_134             	# [6]  
#Block: 204 Pred: 31 Succ: 206 
.L_BB204_stencil_core:	# 0x378
#<freq>
#<freq> BB:204 frequency = 0.75000 (heuristic)
#<freq>
#Block: 206 Pred: 32 204 Succ: 205 207 
.L_BB206_stencil_core:	# 0x378
#<loop> Loop body line 139
#<loop> unrolled 3 times
#<freq>
#<freq> BB:206 frequency = 2.75000 (heuristic)
#<freq> BB:206 => BB:205 probability = 0.12000
#<freq> BB:206 => BB:207 probability = 0.88000
#<freq>
	ldl	$22,0($12)                	# [0]  id:1378 get_reply+0x0
	cmpeq	$4,$22,$22              	# [4]  
#<bpre> branch predict not taken
	bne	$22,.L_BB205_stencil_core 	# [5]  
#Block: 207 Pred: 206 Succ: 205 32 
.L_BB207_stencil_core:	# 0x384
#<loop> Part of loop body line 139, head labeled .L_BB206_stencil_core
#<loop> unrolled 3 times
#<freq>
#<freq> BB:207 frequency = 2.42000 (heuristic)
#<freq> BB:207 => BB:205 probability = 0.12000
#<freq> BB:207 => BB:32 probability = 0.88000
#<freq>
	ldl	$23,0($12)                	# [5]  id:1378 get_reply+0x0
	cmpeq	$4,$23,$23              	# [9]  
#<bpre> branch predict not taken
	bne	$23,.L_BB205_stencil_core 	# [10]  
#Block: 32 Pred: 207 Succ: 205 206 
.Lt_1_136:	# 0x390
#<loop> Part of loop body line 139, head labeled .L_BB206_stencil_core
#<freq>
#<freq> BB:32 frequency = 2.12960 (heuristic)
#<freq> BB:32 => BB:205 probability = 0.12000
#<freq> BB:32 => BB:206 probability = 0.88000
#<freq>
	ldl	$24,0($12)                	# [10]  id:1378 get_reply+0x0
	cmpeq	$4,$24,$24              	# [14]  
#<bpre> branch predict taken
	beq	$24,.L_BB206_stencil_core 	# [15]  
#Block: 205 Pred: 32 206 207 Succ: 33 
.L_BB205_stencil_core:	# 0x39c
#<freq>
#<freq> BB:205 frequency = 0.75000 (heuristic)
#<freq>
#Block: 33 Pred: 205 31 Succ: 34 
.Lt_1_134:	# 0x39c
#<freq>
#<freq> BB:33 frequency = 1.00000 (heuristic)
#<freq>
	.loc	1	152	0
# 148    bsize = (BLKZ)*8;
# 149    athread_get(PE_MODE,&A[src][s_starti-1][s_startj][s_startk]
# 150                   , &A_us[0][0]
# 151                   , len, &get_reply2
# 152                   , 0, stride, bsize);
	ldl	$19,520($sp)              	# [0]  gra_spill_temp_57
	.loc	1	139	0
	ldi	$9,get_reply2($31)        	!tprello	# [0]  get_reply2
	.loc	1	152	0
	ldl	$17,456($sp)              	# [1]  gra_spill_temp_49
	mov	$31,$16                   	# [1]  
	ldl	$10,216($sp)              	# [2]  gra_spill_temp_19
	sll	$19,4,$20                 	# [4]  
	s4addl	$20,$20,$18            	# [5]  
	s4subl	$20,$20,$21            	# [5]  
	s4addl	$18,$21,$18            	# [6]  
	subl	$31,$20,$20              	# [6]  
	sll	$19,8,$19                 	# [7]  
	sll	$18,8,$18                 	# [7]  
	s4addl	$19,$20,$19            	# [8]  
	mov	160,$20                   	# [8]  
	addl	$18,$19,$18              	# [9]  
	ldi	$19,-29112($31)           	# [9]  
	addl	$17,$18,$17              	# [10]  
	ldih	$19,785($19)             	# [10]  
	stl	$17,408($sp)              	# [11]  gra_spill_temp_43
	addl	$17,$11,$17              	# [11]  
	addl	$10,$17,$17              	# [12]  
	stl	$18,312($sp)              	# [12]  gra_spill_temp_31
	.loc	1	139	0
	ldi	$18,A_us($31)             	!tprello	# [13]  A_us
	.loc	1	152	0
	mov	16,$21                    	# [13]  
	.loc	1	144	0
	stl	$31,0($9)                 	# [14]  id:1381 get_reply2+0x0
	ldl	$12,256($sp)              	# [15]  gra_spill_temp_24
	.loc	1	152	0
	stl	$21,0($sp)                	# [16]  id:1817
	mov	$31,$21                   	# [16]  
	stl	$20,8($sp)                	# [17]  id:1818
	mov	$9,$20                    	# [17]  
	.loc	1	139	0
	stl	$18,600($sp)              	# [18]  gra_spill_temp_67
	.loc	1	152	0
	stl	$17,400($sp)              	# [19]  gra_spill_temp_42
	addl	$17,$19,$17              	# [19]  
	ldi	$19,1120($31)             	# [20]  
	.globl	athread_get
	bsr	$26,athread_get           	# [20]  athread_get
#Block: 34 Pred: 33 Succ: 35 
.L_BB34_stencil_core:	# 0x428
#<freq>
#<freq> BB:34 frequency = 1.00000 (heuristic)
#<freq>
	.loc	1	156	0
# 153    athread_get(PE_MODE,&A[src][s_endi][s_startj][s_startk]
# 154                   , &A_ds[0][0]
# 155                   , len, &get_reply2
# 156                   , 0, stride, bsize);
	sll	$12,4,$20                 	# [0]  
	ldl	$17,456($sp)              	# [0]  gra_spill_temp_49
	s4addl	$20,$20,$18            	# [1]  
	s4subl	$20,$20,$21            	# [1]  
	s4addl	$18,$21,$18            	# [2]  
	subl	$31,$20,$20              	# [2]  
	sll	$12,8,$19                 	# [3]  
	sll	$18,8,$18                 	# [3]  
	s4addl	$19,$20,$19            	# [4]  
	mov	160,$20                   	# [4]  
	addl	$18,$19,$18              	# [5]  
	ldi	$19,568($31)              	# [5]  
	addl	$17,$18,$17              	# [6]  
	ldi	$18,A_ds($31)             	!tprello	# [6]  A_ds
	addl	$10,$17,$17              	# [7]  
	ldih	$19,786($19)             	# [7]  
	addl	$11,$17,$17              	# [8]  
	mov	16,$21                    	# [8]  
	stl	$21,0($sp)                	# [9]  id:1819
	mov	$31,$21                   	# [9]  
	addl	$17,$19,$17              	# [10]  
	ldi	$19,1120($31)             	# [10]  
	stl	$18,608($sp)              	# [11]  gra_spill_temp_68
	mov	$31,$16                   	# [11]  
	stl	$20,8($sp)                	# [12]  id:1820
	mov	$9,$20                    	# [12]  
	.globl	athread_get
	bsr	$26,athread_get           	# [13]  athread_get
#Block: 35 Pred: 34 Succ: 36 
.L_BB35_stencil_core:	# 0x494
#<freq>
#<freq> BB:35 frequency = 1.00000 (heuristic)
#<freq>
	.loc	1	164	0
# 160    bsize = (BLKZ)*8;
# 161    athread_get(PE_MODE,&A[src][s_starti][s_startj-1][s_startk]
# 162                     , &A_ls[0][0]
# 163                     , len, &get_reply2
# 164                     , 0, stride, bsize);
	ldl	$17,400($sp)              	# [0]  gra_spill_temp_42
	ldi	$19,392($31)              	# [0]  
	ldi	$20,29520($31)            	# [1]  
	ldih	$19,786($19)             	# [1]  
	ldih	$20,1($20)               	# [2]  
	ldi	$18,A_ls($31)             	!tprello	# [2]  A_ls
	mov	160,$21                   	# [3]  
	ldi	$12,568($31)              	# [3]  
	ldih	$12,786($12)             	# [4]  
	stl	$21,8($sp)                	# [4]  id:1822
	mov	$31,$21                   	# [5]  
	stl	$18,584($sp)              	# [5]  gra_spill_temp_65
	stl	$20,0($sp)                	# [6]  id:1821
	mov	$9,$20                    	# [6]  
	addl	$17,$19,$17              	# [7]  
	ldi	$19,1120($31)             	# [7]  
	mov	$31,$16                   	# [8]  
	.globl	athread_get
	bsr	$26,athread_get           	# [8]  athread_get
#Block: 36 Pred: 35 Succ: 37 
.L_BB36_stencil_core:	# 0x4dc
#<freq>
#<freq> BB:36 frequency = 1.00000 (heuristic)
#<freq>
	.loc	1	168	0
# 165    athread_get(PE_MODE,&A[src][s_starti][s_endj][s_startk]
# 166                     , &A_rs[0][0]
# 167                     , len,&get_reply2
# 168                     , 0, stride, bsize);    
	ldl	$10,288($sp)              	# [0]  gra_spill_temp_28
	ldi	$16,29520($31)            	# [0]  
	ldl	$17,408($sp)              	# [1]  gra_spill_temp_43
	ldih	$16,1($16)               	# [1]  
	stl	$16,0($sp)                	# [2]  id:1823
	mov	$31,$16                   	# [2]  
	mov	$9,$20                    	# [3]  
	mov	$31,$21                   	# [3]  
	sll	$10,4,$18                 	# [4]  
	s8subl	$18,$18,$19            	# [5]  
	s4addl	$18,$19,$18            	# [6]  
	addl	$17,$18,$17              	# [7]  
	ldi	$18,A_rs($31)             	!tprello	# [7]  A_rs
	addl	$11,$17,$17              	# [8]  
	mov	160,$19                   	# [8]  
	stl	$19,8($sp)                	# [9]  id:1824
	ldi	$19,1120($31)             	# [9]  
	addl	$17,$12,$17              	# [10]  
	stl	$18,592($sp)              	# [10]  gra_spill_temp_66
	.globl	athread_get
	bsr	$26,athread_get           	# [11]  athread_get
#Block: 37 Pred: 36 Succ: 208 39 
#  Busy-wait on the word at 0($9) (annotated get_reply2) until it equals 4.
#  This is the compiled form of the source line echoed further down:
#      while(get_reply2 != (2+2));
#  Shape: one peeled test (BB37) that skips the loop when the value is
#  already 4, then a loop body unrolled into three identical polls
#  (BB210, BB211, BB38).  Every poll reloads the value from memory.
.L_BB37_stencil_core:	# 0x52c
#<freq>
#<freq> BB:37 frequency = 1.00000 (heuristic)
#<freq> BB:37 => BB:208 probability = 0.94030
#<freq> BB:37 => BB:39 probability = 0.05970
#<freq>
#  Peeled first test: already complete -> jump past the loop.
	ldl	$17,0($9)                 	# [0]  id:1381 get_reply2+0x0
	cmpeq	$17,4,$17               	# [4]  
#<bpre> branch predict not taken
	bne	$17,.Lt_1_138             	# [5]  
#Block: 208 Pred: 37 Succ: 210 
.L_BB208_stencil_core:	# 0x538
#<freq>
#<freq> BB:208 frequency = 0.94030 (heuristic)
#<freq>
#Block: 210 Pred: 38 208 Succ: 209 211 
.L_BB210_stencil_core:	# 0x538
#<loop> Loop body line 168
#<loop> unrolled 3 times
#<freq>
#<freq> BB:210 frequency = 3.27861 (heuristic)
#<freq> BB:210 => BB:209 probability = 0.12000
#<freq> BB:210 => BB:211 probability = 0.88000
#<freq>
#  Poll 1 of 3: leave the loop as soon as the value equals 4.
	ldl	$18,0($9)                 	# [0]  id:1381 get_reply2+0x0
	cmpeq	$18,4,$18               	# [4]  
#<bpre> branch predict not taken
	bne	$18,.L_BB209_stencil_core 	# [5]  
#Block: 211 Pred: 210 Succ: 209 38 
.L_BB211_stencil_core:	# 0x544
#<loop> Part of loop body line 168, head labeled .L_BB210_stencil_core
#<loop> unrolled 3 times
#<freq>
#<freq> BB:211 frequency = 2.88517 (heuristic)
#<freq> BB:211 => BB:209 probability = 0.12000
#<freq> BB:211 => BB:38 probability = 0.88000
#<freq>
#  Poll 2 of 3.
	ldl	$19,0($9)                 	# [5]  id:1381 get_reply2+0x0
	cmpeq	$19,4,$19               	# [9]  
#<bpre> branch predict not taken
	bne	$19,.L_BB209_stencil_core 	# [10]  
#Block: 38 Pred: 211 Succ: 209 210 
.Lt_1_140:	# 0x550
#<loop> Part of loop body line 168, head labeled .L_BB210_stencil_core
#<freq>
#<freq> BB:38 frequency = 2.53895 (heuristic)
#<freq> BB:38 => BB:209 probability = 0.12000
#<freq> BB:38 => BB:210 probability = 0.88000
#<freq>
#  Poll 3 of 3: branch back to the loop head while the value is not 4,
#  otherwise fall through to the exit.
	ldl	$20,0($9)                 	# [10]  id:1381 get_reply2+0x0
	cmpeq	$20,4,$20               	# [14]  
#<bpre> branch predict taken
	beq	$20,.L_BB210_stencil_core 	# [15]  
#Block: 209 Pred: 38 210 211 Succ: 39 
.L_BB209_stencil_core:	# 0x55c
#<freq>
#<freq> BB:209 frequency = 0.94030 (heuristic)
#<freq>
#Block: 39 Pred: 37 209 Succ: 212 41 
#  Busy-wait on the word at 0($15) (annotated get_reply1) until it equals
#  14.  This is the compiled form of the source line echoed further down:
#      while(get_reply1 != ((BLKX)*2));
#  (so BLKX*2 evaluated to 14 at compile time).  Same shape as the
#  get_reply2 wait before it: a peeled test followed by three unrolled
#  polls, each reloading the value from memory.
.Lt_1_138:	# 0x55c
#<freq>
#<freq> BB:39 frequency = 1.00000 (heuristic)
#<freq> BB:39 => BB:212 probability = 0.94030
#<freq> BB:39 => BB:41 probability = 0.05970
#<freq>
#  Peeled first test: already complete -> jump past the loop.
	ldl	$21,0($15)                	# [0]  id:1380 get_reply1+0x0
	cmpeq	$21,14,$21              	# [4]  
#<bpre> branch predict not taken
	bne	$21,.Lt_1_142             	# [5]  
#Block: 212 Pred: 39 Succ: 214 
.L_BB212_stencil_core:	# 0x568
#<freq>
#<freq> BB:212 frequency = 0.94030 (heuristic)
#<freq>
#Block: 214 Pred: 40 212 Succ: 213 215 
.L_BB214_stencil_core:	# 0x568
#<loop> Loop body line 168
#<loop> unrolled 3 times
#<freq>
#<freq> BB:214 frequency = 3.27861 (heuristic)
#<freq> BB:214 => BB:213 probability = 0.12000
#<freq> BB:214 => BB:215 probability = 0.88000
#<freq>
#  Poll 1 of 3: leave the loop as soon as the value equals 14.
	ldl	$22,0($15)                	# [0]  id:1380 get_reply1+0x0
	cmpeq	$22,14,$22              	# [4]  
#<bpre> branch predict not taken
	bne	$22,.L_BB213_stencil_core 	# [5]  
#Block: 215 Pred: 214 Succ: 213 40 
.L_BB215_stencil_core:	# 0x574
#<loop> Part of loop body line 168, head labeled .L_BB214_stencil_core
#<loop> unrolled 3 times
#<freq>
#<freq> BB:215 frequency = 2.88517 (heuristic)
#<freq> BB:215 => BB:213 probability = 0.12000
#<freq> BB:215 => BB:40 probability = 0.88000
#<freq>
#  Poll 2 of 3.
	ldl	$23,0($15)                	# [5]  id:1380 get_reply1+0x0
	cmpeq	$23,14,$23              	# [9]  
#<bpre> branch predict not taken
	bne	$23,.L_BB213_stencil_core 	# [10]  
#Block: 40 Pred: 215 Succ: 213 214 
.Lt_1_144:	# 0x580
#<loop> Part of loop body line 168, head labeled .L_BB214_stencil_core
#<freq>
#<freq> BB:40 frequency = 2.53895 (heuristic)
#<freq> BB:40 => BB:213 probability = 0.12000
#<freq> BB:40 => BB:214 probability = 0.88000
#<freq>
#  Poll 3 of 3: branch back to the loop head while the value is not 14,
#  otherwise fall through to the exit.
	ldl	$24,0($15)                	# [10]  id:1380 get_reply1+0x0
	cmpeq	$24,14,$24              	# [14]  
#<bpre> branch predict taken
	beq	$24,.L_BB214_stencil_core 	# [15]  
#Block: 213 Pred: 40 214 215 Succ: 41 
.L_BB213_stencil_core:	# 0x58c
#<freq>
#<freq> BB:213 frequency = 0.94030 (heuristic)
#<freq>
#Block: 41 Pred: 39 213 Succ: 42 
#  Profiling timestamps: rtc_ is called twice back to back and its return
#  value ($0) is stored first to dma_et and then to comp_st.  Both calls
#  enter at $ng..rtc_, the label placed after rtc_'s two $gp set-up
#  instructions, so that set-up is skipped.
.Lt_1_142:	# 0x58c
#<freq>
#<freq> BB:41 frequency = 1.00000 (heuristic)
#<freq>
	.loc	1	174	0
# 170    while(get_reply2 != (2+2));
# 171     //8 wait for front back shade data
# 172    while(get_reply1 != ((BLKX)*2));
# 173  #ifdef _PROFILING
# 174    dma_et=rtc_();
	bsr	$26,$ng..rtc_             	# [0]  rtc_
#Block: 42 Pred: 41 Succ: 43 
.L_BB42_stencil_core:	# 0x590
#<freq>
#<freq> BB:42 frequency = 1.00000 (heuristic)
#<freq>
#  $9 now holds the address of dma_et; it is reused after the next call
#  (saved to a spill slot), which relies on rtc_ not modifying $9.
	ldi	$9,dma_et($31)            	!tprello	# [0]  dma_et
	stl	$0,0($9)                  	# [1]  id:1382 dma_et+0x0
	.loc	1	177	0
# 175  #endif
# 176  #ifdef _PROFILING
# 177    comp_st=rtc_();
	bsr	$26,$ng..rtc_             	# [2]  rtc_
#Block: 43 Pred: 42 Succ: 44 72 
.L_BB43_stencil_core:	# 0x59c
#<freq>
#<freq> BB:43 frequency = 1.00000 (heuristic)
#<freq> BB:43 => BB:44 probability = 0.75000
#<freq> BB:43 => BB:72 probability = 0.25000
#<freq>
#  After storing comp_st, $16 = (4 <= $14) (assuming cmple is a signed
#  less-or-equal compare, as on Alpha).  When that is false the code
#  branches to .Lt_1_147; otherwise it falls through into the set-up of
#  the unrolled compute loops.  $14 is set outside this excerpt.
	ldi	$8,comp_st($31)           	!tprello	# [0]  comp_st
	mov	4,$16                     	# [0]  
	cmple	$16,$14,$16             	# [1]  
	stl	$0,0($8)                  	# [1]  id:1383 comp_st+0x0
	stl	$9,296($sp)               	# [2]  gra_spill_temp_29
#<bpre> branch predict not taken
	beq	$16,.Lt_1_147             	# [3]  
#Block: 44 Pred: 43 Succ: 46 
.L_BB44_stencil_core:	# 0x5b4
#<freq>
#<freq> BB:44 frequency = 0.75000 (heuristic)
#<freq>
	ldl	$21,272($sp)              	# [0]  gra_spill_temp_26
	ldi	$19,27892($31)            	# [0]  
	ldih	$19,16310($19)           	# [1]  
	ldi	$4,11639($31)             	# [1]  
	ldih	$4,7969($4)              	# [2]  
	sll	$19,32,$19                	# [2]  
	ldl	$23,464($sp)              	# [3]  gra_spill_temp_50
	addl	$4,$19,$4                	# [3]  
	ldl	$19,712($sp)              	# [4]  gra_spill_temp_81
	sll	$21,2,$21                 	# [4]  
	ldl	$7,664($sp)               	# [5]  gra_spill_temp_75
	sll	$13,2,$18                 	# [5]  
	s8subl	$18,$18,$18            	# [6]  
	s8subl	$21,$21,$21            	# [6]  
	ldi	$17,-27263($31)           	# [7]  
	subw	$14,2,$12                	# [7]  
	srl	$12,63,$20                	# [8]  
	ldih	$17,16308($17)           	# [8]  
	s8subl	$21,$21,$21            	# [9]  
	s8subl	$18,$18,$18            	# [9]  
	ldi	$5,-8913($31)             	# [10]  
	s4addl	$18,$18,$18            	# [10]  
	ldih	$5,1573($5)              	# [11]  
	s4addl	$21,$21,$21            	# [11]  
	sll	$17,32,$17                	# [12]  
	addw	$20,$12,$20              	# [12]  
	subw	$10,$23,$23              	# [13]  
	mov	4,$22                     	# [13]  
	mov	4,$27                     	# [14]  
	mov	3,$25                     	# [14]  
	cmple	$25,$23,$25             	# [15]  
	cmple	$27,$23,$27             	# [15]  
	cmple	$22,$7,$22              	# [16]  
	stl	$23,568($sp)              	# [16]  gra_spill_temp_63
	subw	$23,2,$6                 	# [17]  
	subw	$23,4,$24                	# [17]  
	subw	$23,3,$23                	# [18]  
	sra	$20,1,$20                 	# [18]  
	addl	$5,$17,$5                	# [19]  
	subw	$14,4,$17                	# [19]  
	stl	$21,704($sp)              	# [20]  gra_spill_temp_80
	s8addl	$21,$19,$21            	# [20]  
	stl	$18,720($sp)              	# [21]  gra_spill_temp_82
	s8addl	$18,$19,$18            	# [21]  
	stl	$18,496($sp)              	# [22]  gra_spill_temp_54
	subw	$7,3,$7                  	# [22]  
	stl	$21,504($sp)              	# [23]  gra_spill_temp_55
	stl	$17,488($sp)              	# [24]  gra_spill_temp_53
	stl	$20,176($sp)              	# [25]  gra_spill_temp_14
	stl	$23,432($sp)              	# [26]  gra_spill_temp_46
	stl	$24,472($sp)              	# [27]  gra_spill_temp_51
	stl	$22,576($sp)              	# [28]  gra_spill_temp_64
	stl	$27,440($sp)              	# [29]  gra_spill_temp_47
	stl	$25,632($sp)              	# [30]  gra_spill_temp_71
	stl	$8,160($sp)               	# [31]  gra_spill_temp_12
	stl	$16,168($sp)              	# [32]  gra_spill_temp_13
	stl	$31,512($sp)              	# [33]  gra_spill_temp_56
	stl	$31,480($sp)              	# [34]  gra_spill_temp_52
#Block: 46 Pred: 68 44 Succ: 47 57 
.Lt_1_150:	# 0x69c
#<loop> Loop body line 177, nesting depth: 1, estimated iterations: 2
#<freq>
#<freq> BB:46 frequency = 1.50000 (heuristic)
#<freq> BB:46 => BB:47 probability = 0.94030
#<freq> BB:46 => BB:57 probability = 0.05970
#<freq>
	ldl	$22,440($sp)              	# [0]  gra_spill_temp_47
#<bpre> branch predict not taken
	beq	$22,.Lt_1_152             	# [4]  
#Block: 47 Pred: 46 Succ: 49 
.L_BB47_stencil_core:	# 0x6a4
#<loop> Part of loop body line 177, head labeled .Lt_1_150
#<freq>
#<freq> BB:47 frequency = 1.41045 (heuristic)
#<freq>
	ldl	$24,504($sp)              	# [0]  gra_spill_temp_55
	srl	$6,63,$23                 	# [0]  
	addw	$23,$6,$23               	# [1]  
	ldl	$18,496($sp)              	# [1]  gra_spill_temp_54
	sra	$23,1,$23                 	# [2]  
	stl	$31,616($sp)              	# [2]  gra_spill_temp_69
	stl	$23,200($sp)              	# [3]  gra_spill_temp_17
	stl	$24,624($sp)              	# [4]  gra_spill_temp_70
#Block: 49 Pred: 53 47 Succ: 50 53 
.Lt_1_155:	# 0x6c4
#<loop> Loop body line 177, nesting depth: 2, estimated iterations: 2
#<freq>
#<freq> BB:49 frequency = 2.82090 (heuristic)
#<freq> BB:49 => BB:50 probability = 0.92799
#<freq> BB:49 => BB:53 probability = 0.07201
#<freq>
	ldl	$25,576($sp)              	# [0]  gra_spill_temp_64
#<bpre> branch predict not taken
	beq	$25,.Lt_1_156             	# [4]  
#Block: 50 Pred: 49 Succ: 216 
.L_BB50_stencil_core:	# 0x6cc
#<loop> Part of loop body line 177, head labeled .Lt_1_155
#<freq>
#<freq> BB:50 frequency = 2.61775 (heuristic)
#<freq>
	ldl	$8,624($sp)               	# [0]  gra_spill_temp_70
	mov	$31,$23                   	# [0]  
	mov	$18,$24                   	# [1]  
#Block: 216 Pred: 50 Succ: 52 
.L_BB216_stencil_core:	# 0x6d8
#<loop> Part of loop body line 177, head labeled .Lt_1_155
#<freq>
#<freq> BB:216 frequency = 2.61775 (heuristic)
#<freq>
	.loc	1	183	0
# 179    //5.compute core data
# 180    for(i = 1; i < i_region; i++)
# 181       for(j = 1; j < j_region; j++)
# 182          for(k = 1; k < k_region; k++)
# 183              slave[lhs_no][i][j][k] = alpha_d * slave[rhs_no][i][j][k] + \
	fldd	$22,1440($18)            	# [0]  
	fldd	$21,2568($18)            	# [1]  
	fldd	$19,2400($18)            	# [2]  
	fldd	$20,1288($18)            	# [3]  
	fldd	$16,2408($18)            	# [4]  
	fldd	$17,1448($18)            	# [5]  
	fldd	$25,1280($18)            	# [6]  
#Block: 52 Pred: 52 216 Succ: 217 52 
#  Innermost loop of the stencil update echoed above (source line 183).
#  Per iteration:
#    - $24 is the read base and $8 the write base; both advance by 8 bytes.
#    - $23 counts iterations by 1; the loop repeats until $23 == $7
#      ($7 is set outside this loop).
#    - Four results are stored, at byte offsets 1288, 1448, 2408 and 2568
#      from $8.  These differ by 160 and 1120 bytes, i.e. a 2x2 group of
#      points in the two outer dimensions is updated per iteration.
#    - Each result is built from the value at the same offset off the read
#      base (the centre) and the six values at +/-8, +/-160 and +/-1120
#      bytes from it: the six are summed with faddd, the sum is multiplied
#      by $5, and fmad combines it with the centre and $4 (presumably
#      centre*$4 + sum*$5 -- TODO confirm the fmad operand order).
#    - Values that are still needed on the next iteration are carried in
#      floating-point registers; the mov instructions here copy such
#      values (their destinations are consumed by faddd/fmad, so they
#      appear to be floating-point register copies).
#    - After each fstd to N($8), N($24) is reloaded before being used as a
#      neighbour of another point; presumably the compiler cannot rule out
#      that the read and write areas overlap.
#  Integer and floating-point registers share the $n names in this
#  listing: e.g. the $26 written by cmpeq and tested by beq is an integer
#  register, distinct from the $26 used by faddd/fmuld.
	.align	4
.Lt_1_160:	# 0x6f4
#<loop> Loop body line 177, nesting depth: 3, estimated iterations: 18
#<freq>
#<freq> BB:52 frequency = 47.11957 (heuristic)
#<freq> BB:52 => BB:217 probability = 0.05556
#<freq> BB:52 => BB:52 probability = 0.94444
#<freq>
	fldd	$27,168($24)             	# [0]  id:1389 slave+0x0
	mov	$17,$9                    	# [0]  
	fldd	$26,1128($24)            	# [1]  id:1388 slave+0x0
	mov	$16,$3                    	# [1]  
	fldd	$13,328($24)             	# [2]  id:1405 slave+0x0
	addw	$23,1,$23                	# [2]  
	fldd	$15,3528($24)            	# [3]  id:1398 slave+0x0
	faddd	$27,$16,$27             	# [4]  
	fldd	$11,1608($24)            	# [5]  id:1403 slave+0x0
	faddd	$13,$21,$13             	# [6]  
	fldd	$10,2248($24)            	# [7]  id:1396 slave+0x0
	faddd	$26,$27,$26             	# [11]  
	fldd	$16,2416($24)            	# [12]  id:1393 slave+0x0
	mov	$21,$27                   	# [12]  
	fldd	$2,3688($24)             	# [13]  id:1414 slave+0x0
	faddd	$17,$26,$26             	# [18]  
	fldd	$17,1456($24)            	# [19]  id:1401 slave+0x0
	faddd	$25,$26,$26             	# [25]  
	mov	$20,$25                   	# [26]  
	fldd	$20,1296($24)            	# [26]  id:1385 slave+0x0
	fldd	$1,2728($24)             	# [27]  id:1411 slave+0x0
	faddd	$20,$26,$26             	# [32]  
	fldd	$28,2560($24)            	# [33]  id:1410 slave+0x0
	fmuld	$26,$5,$26              	# [39]  
	fmad	$25,$4,$26,$25           	# [46]  
#  Loop-exit condition is computed early; it is tested by the final beq.
	cmpeq	$23,$7,$26              	# [46]  
#  Result 1 (offset 1288), then reload of the same offset from the read base.
	fstd	$25,1288($8)             	# [56]  id:1391 slave+0x0
	fldd	$25,1288($24)            	# [57]  id:1397 slave+0x0
	faddd	$25,$15,$15             	# [61]  
	faddd	$25,$13,$13             	# [62]  
	faddd	$10,$15,$10             	# [68]  
	faddd	$11,$13,$11             	# [69]  
	faddd	$21,$10,$10             	# [75]  
	fldd	$21,2576($24)            	# [75]  id:1409 slave+0x0
	faddd	$22,$11,$11             	# [76]  
	faddd	$19,$10,$10             	# [82]  
	faddd	$17,$11,$11             	# [83]  
	faddd	$16,$10,$10             	# [89]  
	fmuld	$11,$5,$11              	# [90]  
	fmuld	$10,$5,$10              	# [96]  
	fmad	$9,$4,$11,$9             	# [97]  
	fmad	$3,$4,$10,$3             	# [103]  
#  Result 2 (offset 1448) and its reload.
	fstd	$9,1448($8)              	# [107]  id:1407 slave+0x0
	fldd	$22,1448($24)            	# [108]  id:1413 slave+0x0
	faddd	$22,$2,$2               	# [112]  
#  Result 3 (offset 2408) and its reload; the read base then advances.
	fstd	$3,2408($8)              	# [117]  id:1399 slave+0x0
	fldd	$19,2408($24)            	# [118]  id:1412 slave+0x0
	ldi	$24,8($24)                	# [118]  
	faddd	$19,$2,$2               	# [122]  
	faddd	$1,$2,$1                	# [129]  
	faddd	$28,$1,$28              	# [136]  
	faddd	$21,$28,$28             	# [143]  
	fmuld	$28,$5,$28              	# [150]  
	fmad	$27,$4,$28,$27           	# [157]  
#  Result 4 (offset 2568); the write base then advances.
	fstd	$27,2568($8)             	# [167]  id:1415 slave+0x0
	ldi	$8,8($8)                  	# [167]  
#<bpre> branch predict taken
	beq	$26,.Lt_1_160             	# [168]  
#Block: 217 Pred: 52 Succ: 53 
.L_BB217_stencil_core:	# 0x7d8
#<loop> Part of loop body line 177, head labeled .Lt_1_155
#<freq>
#<freq> BB:217 frequency = 2.61775 (heuristic)
#<freq>
#Block: 53 Pred: 217 49 Succ: 54 49 
#  Latch of the depth-2 loop headed at .Lt_1_155.  It
#    - adds 2 to the loop counter kept in gra_spill_temp_69,
#    - advances $18 and the pointer kept in gra_spill_temp_70 by 320 bytes
#      each (320 = 2 * 160; 160 is the per-row byte step used by the
#      remainder loop elsewhere in this function, so this presumably
#      moves both by two rows), and
#    - branches back to .Lt_1_155 while the updated counter is <= the
#      bound kept in gra_spill_temp_51 (assuming cmple is a signed
#      less-or-equal compare).
.Lt_1_156:	# 0x7d8
#<loop> Part of loop body line 177, head labeled .Lt_1_155
#<freq>
#<freq> BB:53 frequency = 2.82090 (heuristic)
#<freq> BB:53 => BB:54 probability = 0.50000
#<freq> BB:53 => BB:49 probability = 0.50000
#<freq>
	ldl	$28,616($sp)              	# [0]  gra_spill_temp_69
	ldi	$18,320($18)              	# [0]  
	ldl	$1,472($sp)               	# [1]  gra_spill_temp_51
	addw	$28,2,$28                	# [4]  
	stl	$28,616($sp)              	# [5]  gra_spill_temp_69
#  $28 becomes the loop-continue flag; $1 is then reused for the pointer.
	cmple	$28,$1,$28              	# [8]  
	ldl	$1,624($sp)               	# [9]  gra_spill_temp_70
	ldi	$1,320($1)                	# [13]  
	stl	$1,624($sp)               	# [14]  gra_spill_temp_70
#<bpre> branch predict unknown
	bne	$28,.Lt_1_155             	# [15]  
#Block: 54 Pred: 53 Succ: 55 68 
.L_BB54_stencil_core:	# 0x800
#<loop> Part of loop body line 177, head labeled .Lt_1_150
#<freq>
#<freq> BB:54 frequency = 1.41045 (heuristic)
#<freq> BB:54 => BB:55 probability = 0.84000
#<freq> BB:54 => BB:68 probability = 0.16000
#<freq>
	ldl	$2,576($sp)               	# [0]  gra_spill_temp_64
#<bpre> branch predict not taken
	beq	$2,.Lt_1_165              	# [4]  
#Block: 55 Pred: 54 Succ: 68 56 
.L_BB55_stencil_core:	# 0x808
#<loop> Part of loop body line 177, head labeled .Lt_1_150
#<freq>
#<freq> BB:55 frequency = 1.18478 (heuristic)
#<freq> BB:55 => BB:68 probability = 0.25000
#<freq> BB:55 => BB:56 probability = 0.75000
#<freq>
	ldl	$3,616($sp)               	# [0]  gra_spill_temp_69
	ldl	$8,432($sp)               	# [1]  gra_spill_temp_46
	cmple	$3,$8,$3                	# [5]  
#<bpre> branch predict not taken
	beq	$3,.Lt_1_165              	# [6]  
#Block: 56 Pred: 55 58 Succ: 64 
.Lt_1_306:	# 0x818
#<loop> Part of loop body line 177, head labeled .Lt_1_150
#<freq>
#<freq> BB:56 frequency = 0.95177 (heuristic)
#<freq>
	ldl	$15,616($sp)              	# [0]  gra_spill_temp_69
	ldl	$16,480($sp)              	# [1]  gra_spill_temp_52
	s4addl	$15,$15,$11            	# [4]  
	ldl	$10,720($sp)              	# [5]  gra_spill_temp_82
	s4addl	$11,$16,$11            	# [8]  
	ldl	$16,704($sp)              	# [9]  gra_spill_temp_80
	addl	$11,$10,$10              	# [12]  
	addl	$11,$16,$11              	# [16]  
	ldl	$16,712($sp)              	# [16]  gra_spill_temp_81
	s8addl	$10,$16,$10            	# [20]  
	s8addl	$11,$16,$11            	# [20]  
#Block: 64 Pred: 67 56 Succ: 218 
.Lt_1_169:	# 0x844
#<loop> Loop body line 183, nesting depth: 2, estimated iterations: 1
#<freq>
#<freq> BB:64 frequency = 0.95177 (heuristic)
#<freq>
	mov	$31,$20                   	# [0]  
	mov	$10,$21                   	# [0]  
	mov	$11,$16                   	# [1]  
#Block: 218 Pred: 64 Succ: 222 221 
.L_BB218_stencil_core:	# 0x850
#<loop> Part of loop body line 183, head labeled .Lt_1_169
#<freq>
#<freq> BB:218 frequency = 0.95177 (heuristic)
#<freq> BB:218 => BB:222 probability = 0.50000
#<freq> BB:218 => BB:221 probability = 0.50000
#<freq>
	fldd	$23,1288($10)            	# [0]  
	and	$7,1,$18                  	# [0]  
	fldd	$24,2408($10)            	# [1]  
	mov	$23,$17                   	# [4]  
	fldd	$22,1280($10)            	# [5]  
	mov	$24,$19                   	# [8]  
	mov	$22,$8                    	# [12]  
#<bpre> branch predict unknown
	beq	$18,.L_BB221_stencil_core 	# [12]  
#Block: 222 Pred: 218 Succ: 221 
.L_BB222_stencil_core:	# 0x870
#<loop> Part of loop body line 183, head labeled .Lt_1_169
#<loop> Unrolling remainder loop (at most 1 iteration)
#<freq>
#<freq> BB:222 frequency = 0.47589 (heuristic)
#<freq>
	fldd	$2,168($10)              	# [0]  id:1421 slave+0x0
	ldi	$16,8($11)                	# [0]  
	fldd	$1,1128($10)             	# [1]  id:1420 slave+0x0
	faddd	$2,$24,$2               	# [4]  
	fldd	$28,1448($10)            	# [5]  id:1419 slave+0x0
	faddd	$1,$2,$1                	# [11]  
	fldd	$17,1296($10)            	# [12]  id:1417 slave+0x0
	faddd	$28,$1,$28              	# [18]  
	fldd	$27,3528($10)            	# [19]  id:1430 slave+0x0
	faddd	$22,$28,$28             	# [25]  
	fldd	$25,2248($10)            	# [26]  id:1428 slave+0x0
	faddd	$17,$28,$28             	# [32]  
	fldd	$21,2568($10)            	# [33]  id:1427 slave+0x0
	fmuld	$28,$5,$28              	# [39]  
	fldd	$20,2400($10)            	# [40]  id:1426 slave+0x0
	fmad	$23,$4,$28,$28           	# [46]  
	fldd	$19,2416($10)            	# [47]  id:1425 slave+0x0
	fstd	$28,1288($11)            	# [56]  id:1423 slave+0x0
	fldd	$8,1288($10)             	# [57]  id:1429 slave+0x0
	faddd	$8,$27,$27              	# [61]  
	faddd	$25,$27,$25             	# [68]  
	faddd	$21,$25,$21             	# [75]  
	faddd	$20,$21,$20             	# [82]  
	ldi	$21,8($10)                	# [82]  
	faddd	$19,$20,$20             	# [89]  
	fmuld	$20,$5,$20              	# [96]  
	fmad	$24,$4,$20,$20           	# [103]  
	fstd	$20,2408($11)            	# [113]  id:1431 slave+0x0
	addw	$31,1,$20                	# [113]  
#Block: 221 Pred: 218 222 Succ: 224 223 
.L_BB221_stencil_core:	# 0x8e4
#<loop> Part of loop body line 183, head labeled .Lt_1_169
#<freq>
#<freq> BB:221 frequency = 0.95177 (heuristic)
#<freq> BB:221 => BB:224 probability = 0.88889
#<freq> BB:221 => BB:223 probability = 0.11111
#<freq>
	sra	$7,1,$26                  	# [0]  
#<bpre> branch predict not taken
	beq	$26,.L_BB223_stencil_core 	# [1]  
#Block: 224 Pred: 221 Succ: 220 
.L_BB224_stencil_core:	# 0x8ec
#<loop> Part of loop body line 183, head labeled .Lt_1_169
#<freq>
#<freq> BB:224 frequency = 0.84602 (heuristic)
#<freq>
#Block: 220 Pred: 220 224 Succ: 220 225 
	.align	4
.L_BB220_stencil_core:	# 0x8ec
#<loop> Loop body line 183, nesting depth: 3, estimated iterations: 9
#<loop> unrolled 2 times
#<freq>
#<freq> BB:220 frequency = 4.75885 (heuristic)
#<freq> BB:220 => BB:220 probability = 0.88889
#<freq> BB:220 => BB:225 probability = 0.11111
#<freq>
	fldd	$2,168($21)              	# [0]  id:1421 slave+0x0
	addw	$20,2,$20                	# [0]  
	fldd	$1,1128($21)             	# [1]  id:1420 slave+0x0
	cmpeq	$20,$7,$3               	# [1]  
	fldd	$28,1448($21)            	# [2]  id:1419 slave+0x0
	faddd	$2,$19,$2               	# [4]  
	fldd	$27,1296($21)            	# [5]  id:1417 slave+0x0
	faddd	$1,$2,$1                	# [11]  
	fldd	$23,176($21)             	# [12]  id:1421 slave+0x0
	faddd	$28,$1,$28              	# [18]  
	fldd	$9,2416($21)             	# [19]  id:1425 slave+0x0
	faddd	$8,$28,$28              	# [25]  
	fldd	$22,1136($21)            	# [26]  id:1420 slave+0x0
	faddd	$23,$9,$23              	# [29]  
	fldd	$18,1456($21)            	# [30]  id:1419 slave+0x0
	faddd	$27,$28,$28             	# [32]  
	fldd	$8,3528($21)             	# [33]  id:1430 slave+0x0
	faddd	$22,$23,$22             	# [36]  
	fldd	$2,2248($21)             	# [37]  id:1428 slave+0x0
	fmuld	$28,$5,$28              	# [39]  
	fldd	$1,2568($21)             	# [40]  id:1427 slave+0x0
	faddd	$18,$22,$18             	# [43]  
	fldd	$24,2400($21)            	# [44]  id:1426 slave+0x0
	fmad	$17,$4,$28,$28           	# [46]  
	fldd	$17,1304($21)            	# [47]  id:1417 slave+0x0
	fldd	$25,3536($21)            	# [48]  id:1430 slave+0x0
	fldd	$23,2256($21)            	# [49]  id:1428 slave+0x0
	fldd	$22,2576($21)            	# [50]  id:1427 slave+0x0
	fstd	$28,1288($16)            	# [56]  id:1423 slave+0x0
	fldd	$28,1288($21)            	# [57]  id:1429 slave+0x0
	faddd	$28,$8,$8               	# [61]  
	faddd	$28,$18,$28             	# [62]  
	faddd	$2,$8,$2                	# [68]  
	faddd	$17,$28,$28             	# [69]  
	faddd	$1,$2,$1                	# [75]  
	fmuld	$28,$5,$28              	# [76]  
	faddd	$24,$1,$24              	# [82]  
	fmad	$27,$4,$28,$27           	# [83]  
	faddd	$9,$24,$24              	# [89]  
	fstd	$27,1296($16)            	# [93]  id:1423 slave+0x0
	fldd	$8,1296($21)             	# [94]  id:1429 slave+0x0
	fmuld	$24,$5,$24              	# [100]  
	faddd	$8,$25,$25              	# [104]  
	fmad	$19,$4,$24,$24           	# [107]  
	fldd	$19,2424($21)            	# [107]  id:1425 slave+0x0
	faddd	$23,$25,$23             	# [111]  
	fstd	$24,2408($16)            	# [117]  id:1431 slave+0x0
	fldd	$18,2408($21)            	# [118]  id:1426 slave+0x0
	ldi	$21,16($21)               	# [118]  
	faddd	$22,$23,$22             	# [124]  
	faddd	$18,$22,$18             	# [131]  
	faddd	$19,$18,$18             	# [138]  
	fmuld	$18,$5,$18              	# [145]  
	fmad	$9,$4,$18,$9             	# [152]  
	fstd	$9,2416($16)             	# [162]  id:1431 slave+0x0
	ldi	$16,16($16)               	# [162]  
#<bpre> branch predict taken
	beq	$3,.L_BB220_stencil_core  	# [163]  
#Block: 225 Pred: 220 Succ: 223 
.L_BB225_stencil_core:	# 0x9d0
#<loop> Part of loop body line 183, head labeled .Lt_1_169
#<freq>
#<freq> BB:225 frequency = 0.52876 (heuristic)
#<freq>
#Block: 223 Pred: 221 225 Succ: 219 
.L_BB223_stencil_core:	# 0x9d0
#<loop> Part of loop body line 183, head labeled .Lt_1_169
#<freq>
#<freq> BB:223 frequency = 0.00000 (heuristic)
#<freq>
#Block: 219 Pred: 223 Succ: 67 
.L_BB219_stencil_core:	# 0x9d0
#<loop> Part of loop body line 183, head labeled .Lt_1_169
#<freq>
#<freq> BB:219 frequency = 0.95177 (heuristic)
#<freq>
#Block: 67 Pred: 219 Succ: 68 64 
.L_BB67_stencil_core:	# 0x9d0
#<loop> Part of loop body line 183, head labeled .Lt_1_169
#<freq>
#<freq> BB:67 frequency = 0.95177 (heuristic)
#<freq> BB:67 => BB:68 probability = 1.00000
#<freq> BB:67 => BB:64 probability = 0.00000
#<freq>
	addw	$15,1,$15                	# [0]  
	ldi	$10,160($10)              	# [0]  
	cmpeq	$15,$6,$3               	# [1]  
	ldi	$11,160($11)              	# [1]  
#<bpre> branch predict not taken
	beq	$3,.Lt_1_169.bpre         	# [2]  
#Block: 68 Pred: 67 54 55 57 317 Succ: 69 46 
#  Latch of the depth-1 loop headed at .Lt_1_150.  It
#    - adds 2 to the loop counter kept in gra_spill_temp_56,
#    - advances the pointers kept in gra_spill_temp_54 and
#      gra_spill_temp_55 by 2240 bytes each,
#    - advances the value kept in gra_spill_temp_52 by 280 (280 * 8 = 2240,
#      so this presumably tracks the same step in 8-byte elements), and
#    - branches back to .Lt_1_150 while the updated counter is <= the
#      bound kept in gra_spill_temp_53 (assuming cmple is a signed
#      less-or-equal compare).
.Lt_1_165:	# 0x9e4
.Lt_1_163:	# 0x9e4
#<loop> Part of loop body line 177, head labeled .Lt_1_150
#<freq>
#<freq> BB:68 frequency = 1.50000 (heuristic)
#<freq> BB:68 => BB:69 probability = 0.50000
#<freq> BB:68 => BB:46 probability = 0.50000
#<freq>
	ldl	$17,496($sp)              	# [0]  gra_spill_temp_54
	ldl	$8,512($sp)               	# [1]  gra_spill_temp_56
	ldi	$17,2240($17)             	# [4]  
	ldl	$16,488($sp)              	# [5]  gra_spill_temp_53
	addw	$8,2,$8                  	# [8]  
	stl	$8,512($sp)               	# [9]  gra_spill_temp_56
#  $8 becomes the loop-continue flag; $16 and $17 are then reused for the
#  remaining spill-slot updates.
	cmple	$8,$16,$8               	# [12]  
	ldl	$16,480($sp)              	# [13]  gra_spill_temp_52
	stl	$17,496($sp)              	# [14]  gra_spill_temp_54
	ldi	$16,280($16)              	# [17]  
	ldl	$17,504($sp)              	# [18]  gra_spill_temp_55
	stl	$16,480($sp)              	# [19]  gra_spill_temp_52
	ldi	$17,2240($17)             	# [22]  
	stl	$17,504($sp)              	# [23]  gra_spill_temp_55
#<bpre> branch predict unknown
	bne	$8,.Lt_1_150              	# [24]  
#Block: 69 Pred: 68 Succ: 70 74 
.L_BB69_stencil_core:	# 0xa20
#<freq>
#<freq> BB:69 frequency = 0.75000 (heuristic)
#<freq> BB:69 => BB:70 probability = 0.50000
#<freq> BB:69 => BB:74 probability = 0.50000
#<freq>
	ldl	$18,512($sp)              	# [0]  gra_spill_temp_56
	subw	$14,3,$19                	# [0]  
	cmple	$18,$19,$18             	# [4]  
#<bpre> branch predict unknown
	beq	$18,.Lt_1_321             	# [5]  
#Block: 70 Pred: 69 Succ: 71 
.L_BB70_stencil_core:	# 0xa30
#<freq>
#<freq> BB:70 frequency = 0.37500 (heuristic)
#<freq>
	mov	3,$20                     	# [0]  
	cmple	$20,$14,$20             	# [1]  
	stl	$20,552($sp)              	# [2]  gra_spill_temp_61
#Block: 71 Pred: 70 73 Succ: 81 
.Lt_1_307:	# 0xa3c
#<freq>
#<freq> BB:71 frequency = 0.50000 (heuristic)
#<freq>
	ldl	$18,512($sp)              	# [0]  gra_spill_temp_56
	ldl	$15,704($sp)              	# [1]  gra_spill_temp_80
	subw	$14,$18,$27              	# [4]  
	subw	$27,2,$27                	# [5]  
	ldl	$26,720($sp)              	# [5]  gra_spill_temp_82
	stl	$27,80($sp)               	# [6]  gra_spill_temp_2
	sll	$18,2,$13                 	# [6]  
	ldl	$27,712($sp)              	# [7]  gra_spill_temp_81
	s8subl	$13,$13,$13            	# [7]  
	s4addl	$13,$13,$13            	# [8]  
	addl	$13,$26,$26              	# [9]  
	addl	$13,$15,$15              	# [9]  
	s8addl	$15,$27,$15            	# [11]  
	s8addl	$26,$27,$26            	# [11]  
#Block: 81 Pred: 103 71 Succ: 82 92 
.Lt_1_180:	# 0xa74
#<loop> Loop body line 183, nesting depth: 1, estimated iterations: 1
#<freq>
#<freq> BB:81 frequency = 0.50000 (heuristic)
#<freq> BB:81 => BB:82 probability = 0.94030
#<freq> BB:81 => BB:92 probability = 0.05970
#<freq>
	ldl	$16,440($sp)              	# [0]  gra_spill_temp_47
#<bpre> branch predict not taken
	beq	$16,.Lt_1_182             	# [4]  
#Block: 82 Pred: 81 Succ: 84 
.L_BB82_stencil_core:	# 0xa7c
#<loop> Part of loop body line 183, head labeled .Lt_1_180
#<freq>
#<freq> BB:82 frequency = 0.47015 (heuristic)
#<freq>
	srl	$6,63,$17                 	# [0]  
	mov	$31,$11                   	# [0]  
	addw	$17,$6,$17               	# [1]  
	mov	$26,$9                    	# [1]  
	sra	$17,1,$17                 	# [2]  
	mov	$15,$10                   	# [2]  
	stl	$17,72($sp)               	# [3]  gra_spill_temp_1
#Block: 84 Pred: 88 82 Succ: 85 88 
.Lt_1_185:	# 0xa98
#<loop> Loop body line 183, nesting depth: 2, estimated iterations: 2
#<freq>
#<freq> BB:84 frequency = 0.94030 (heuristic)
#<freq> BB:84 => BB:85 probability = 0.92799
#<freq> BB:84 => BB:88 probability = 0.07201
#<freq>
	ldl	$19,576($sp)              	# [0]  gra_spill_temp_64
#<bpre> branch predict not taken
	beq	$19,.Lt_1_186             	# [4]  
#Block: 85 Pred: 84 Succ: 226 
.L_BB85_stencil_core:	# 0xaa0
#<loop> Part of loop body line 183, head labeled .Lt_1_185
#<freq>
#<freq> BB:85 frequency = 0.87258 (heuristic)
#<freq>
	mov	$31,$21                   	# [0]  
	mov	$9,$20                    	# [0]  
	mov	$10,$8                    	# [1]  
#Block: 226 Pred: 85 Succ: 230 229 
.L_BB226_stencil_core:	# 0xaac
#<loop> Part of loop body line 183, head labeled .Lt_1_185
#<freq>
#<freq> BB:226 frequency = 0.87258 (heuristic)
#<freq> BB:226 => BB:230 probability = 0.50000
#<freq> BB:226 => BB:229 probability = 0.50000
#<freq>
	fldd	$24,1288($9)             	# [0]  
	and	$7,1,$25                  	# [0]  
	fldd	$22,1448($9)             	# [1]  
	mov	$24,$17                   	# [4]  
	fldd	$23,1280($9)             	# [5]  
	mov	$22,$19                   	# [8]  
	mov	$23,$16                   	# [12]  
#<bpre> branch predict unknown
	beq	$25,.L_BB229_stencil_core 	# [12]  
#Block: 230 Pred: 226 Succ: 229 
.L_BB230_stencil_core:	# 0xacc
#<loop> Part of loop body line 183, head labeled .Lt_1_185
#<loop> Unrolling remainder loop (at most 1 iteration)
#<freq>
#<freq> BB:230 frequency = 0.43629 (heuristic)
#<freq>
	fldd	$16,2408($9)             	# [0]  id:1438 slave+0x0
	ldi	$20,8($9)                 	# [0]  
	fldd	$8,168($9)               	# [1]  id:1437 slave+0x0
	addw	$31,1,$21                	# [1]  
	fldd	$3,1128($9)              	# [2]  id:1436 slave+0x0
	faddd	$8,$16,$8               	# [5]  
	fldd	$17,1296($9)             	# [6]  id:1433 slave+0x0
	faddd	$3,$8,$3                	# [12]  
	fldd	$2,2568($9)              	# [13]  id:1446 slave+0x0
	ldi	$8,8($10)                 	# [13]  
	fldd	$1,328($9)               	# [14]  id:1445 slave+0x0
	faddd	$22,$3,$3               	# [19]  
	fldd	$28,1608($9)             	# [20]  id:1443 slave+0x0
	faddd	$1,$2,$1                	# [23]  
	fldd	$27,1440($9)             	# [24]  id:1442 slave+0x0
	faddd	$23,$3,$3               	# [26]  
	fldd	$19,1456($9)             	# [27]  id:1441 slave+0x0
	faddd	$17,$3,$3               	# [33]  
	fmuld	$3,$5,$3                	# [40]  
	fmad	$24,$4,$3,$3             	# [47]  
	fstd	$3,1288($10)             	# [57]  id:1439 slave+0x0
	fldd	$16,1288($9)             	# [58]  id:1444 slave+0x0
	faddd	$16,$1,$1               	# [62]  
	faddd	$28,$1,$28              	# [69]  
	faddd	$27,$28,$27             	# [76]  
	faddd	$19,$27,$27             	# [83]  
	fmuld	$27,$5,$27              	# [90]  
	fmad	$22,$4,$27,$27           	# [97]  
	fstd	$27,1448($10)            	# [107]  id:1447 slave+0x0
#Block: 229 Pred: 226 230 Succ: 232 231 
.L_BB229_stencil_core:	# 0xb40
#<loop> Part of loop body line 183, head labeled .Lt_1_185
#<freq>
#<freq> BB:229 frequency = 0.87258 (heuristic)
#<freq> BB:229 => BB:232 probability = 0.88889
#<freq> BB:229 => BB:231 probability = 0.11111
#<freq>
	sra	$7,1,$22                  	# [0]  
#<bpre> branch predict not taken
	beq	$22,.L_BB231_stencil_core 	# [1]  
#Block: 232 Pred: 229 Succ: 228 
.L_BB232_stencil_core:	# 0xb48
#<loop> Part of loop body line 183, head labeled .Lt_1_185
#<freq>
#<freq> BB:232 frequency = 0.77563 (heuristic)
#<freq>
	stl	$22,736($sp)              	# [0]  gra_spill_temp_84
#Block: 228 Pred: 228 232 Succ: 228 233 
	.align	4
.L_BB228_stencil_core:	# 0xb4c
#<loop> Loop body line 183, nesting depth: 3, estimated iterations: 9
#<loop> unrolled 2 times
#<freq>
#<freq> BB:228 frequency = 4.36292 (heuristic)
#<freq> BB:228 => BB:228 probability = 0.88889
#<freq> BB:228 => BB:233 probability = 0.11111
#<freq>
# Main body of the inner loop, unrolled by two (see the <loop> note above).
# Per trip it produces two consecutive 8-byte results for each of two output
# rows: stores go to 1288/1296($8) and 1448/1456($8), i.e. rows 160 bytes
# apart.  Every result follows the same recipe:
#   sum = six faddd-accumulated inputs around the centre
#         (offsets +-8, +-160 and +-1120 bytes from it)
#   out = fmad(centre, $4, fmuld(sum, $5))
# NOTE(review): this has the shape alpha_d * centre + beta_d * (neighbours)
# used in the C source, which would make $4 = alpha_d and $5 = beta_d -
# confirm against the code that loads $4/$5 (not in this section).
# Integer state: $21 = element counter (+2 per trip, loop ends when it
# equals $7), $20 = load base and $8 = store base (both +16 bytes per trip).
# Several loads late in the body ($17, $16, $19) fetch values that are only
# consumed at the top of the next trip, so the instruction order and the
# register assignment must be changed together or not at all.
	fldd	$22,2408($20)            	# [0]  id:1438 slave+0x0
	addw	$21,2,$21                	# [0]  
	fldd	$3,168($20)              	# [1]  id:1437 slave+0x0
	fldd	$2,1128($20)             	# [2]  id:1436 slave+0x0
	faddd	$3,$22,$3               	# [5]  
	fldd	$24,1296($20)            	# [6]  id:1433 slave+0x0
	faddd	$2,$3,$2                	# [12]  
	fldd	$1,2416($20)             	# [13]  id:1438 slave+0x0
	faddd	$19,$2,$2               	# [19]  
	fldd	$28,176($20)             	# [20]  id:1437 slave+0x0
	faddd	$16,$2,$2               	# [26]  
	fldd	$27,1136($20)            	# [27]  id:1436 slave+0x0
	faddd	$28,$1,$28              	# [30]  
	fldd	$1,1456($20)             	# [31]  id:1441 slave+0x0
	faddd	$24,$2,$2               	# [33]  
	fldd	$3,2568($20)             	# [34]  id:1446 slave+0x0
	faddd	$27,$28,$27             	# [37]  
	fldd	$28,328($20)             	# [38]  id:1445 slave+0x0
	fmuld	$2,$5,$2                	# [40]  
	fldd	$23,1440($20)            	# [41]  id:1442 slave+0x0
	faddd	$28,$3,$28              	# [44]  
	faddd	$1,$27,$27              	# [45]  
	fldd	$22,336($20)             	# [45]  id:1445 slave+0x0
	fldd	$3,1616($20)             	# [46]  id:1443 slave+0x0
	fmad	$17,$4,$2,$2             	# [47]  
	fldd	$17,1304($20)            	# [48]  id:1433 slave+0x0
	fstd	$2,1288($8)              	# [57]  id:1439 slave+0x0
	fldd	$25,1288($20)            	# [58]  id:1444 slave+0x0
	faddd	$25,$28,$28             	# [62]  
	faddd	$25,$27,$25             	# [63]  
	fldd	$27,1608($20)            	# [63]  id:1443 slave+0x0
	faddd	$27,$28,$27             	# [69]  
	cmpeq	$21,$7,$28              	# [69]  
	faddd	$17,$25,$25             	# [70]  
	faddd	$23,$27,$23             	# [76]  
	fmuld	$25,$5,$25              	# [77]  
	faddd	$1,$23,$23              	# [83]  
	fmad	$24,$4,$25,$24           	# [84]  
	fldd	$25,2576($20)            	# [84]  id:1446 slave+0x0
	faddd	$22,$25,$22             	# [88]  
	fstd	$24,1296($8)             	# [94]  id:1439 slave+0x0
	fmuld	$23,$5,$23              	# [95]  
	fldd	$16,1296($20)            	# [95]  id:1444 slave+0x0
	faddd	$16,$22,$22             	# [99]  
	fmad	$19,$4,$23,$19           	# [102]  
	faddd	$3,$22,$3               	# [106]  
	fstd	$19,1448($8)             	# [112]  id:1447 slave+0x0
	fldd	$2,1448($20)             	# [113]  id:1442 slave+0x0
	fldd	$19,1464($20)            	# [114]  id:1441 slave+0x0
	ldi	$20,16($20)               	# [114]  
	faddd	$2,$3,$2                	# [117]  
	faddd	$19,$2,$2               	# [124]  
	fmuld	$2,$5,$2                	# [131]  
	fmad	$1,$4,$2,$1              	# [138]  
	fstd	$1,1456($8)              	# [148]  id:1447 slave+0x0
	ldi	$8,16($8)                 	# [148]  
#<bpre> branch predict taken
	beq	$28,.L_BB228_stencil_core 	# [149]  
#Block: 233 Pred: 228 Succ: 231 
.L_BB233_stencil_core:	# 0xc30
#<loop> Part of loop body line 183, head labeled .Lt_1_185
#<freq>
#<freq> BB:233 frequency = 0.48477 (heuristic)
#<freq>
#Block: 231 Pred: 229 233 Succ: 227 
.L_BB231_stencil_core:	# 0xc30
#<loop> Part of loop body line 183, head labeled .Lt_1_185
#<freq>
#<freq> BB:231 frequency = 0.00000 (heuristic)
#<freq>
#Block: 227 Pred: 231 Succ: 88 
.L_BB227_stencil_core:	# 0xc30
#<loop> Part of loop body line 183, head labeled .Lt_1_185
#<freq>
#<freq> BB:227 frequency = 0.87258 (heuristic)
#<freq>
#Block: 88 Pred: 227 84 Succ: 89 84 
.Lt_1_186:	# 0xc30
#<loop> Part of loop body line 183, head labeled .Lt_1_185
#<freq>
#<freq> BB:88 frequency = 0.94030 (heuristic)
#<freq> BB:88 => BB:89 probability = 0.50000
#<freq> BB:88 => BB:84 probability = 0.50000
#<freq>
# Latch of the loop headed by .Lt_1_185.  The three empty blocks above carry
# no instructions and simply fall through to here.
# Step the counter $11 by 2 and the pointers $10 and $9 by 320 bytes each
# (two rows, given the 160-byte spacing of the stores in the inner loop),
# then go round again while $11 <= the bound reloaded from gra_spill_temp_51.
	ldl	$23,472($sp)              	# [0]  gra_spill_temp_51
	addw	$11,2,$11                	# [0]  
	ldi	$10,320($10)              	# [1]  
	ldi	$9,320($9)                	# [1]  
	cmple	$11,$23,$23             	# [4]  
#<bpre> branch predict unknown
	bne	$23,.Lt_1_185             	# [5]  
#Block: 89 Pred: 88 Succ: 90 103 
.L_BB89_stencil_core:	# 0xc48
#<loop> Part of loop body line 183, head labeled .Lt_1_180
#<freq>
#<freq> BB:89 frequency = 0.47015 (heuristic)
#<freq> BB:89 => BB:90 probability = 0.84000
#<freq> BB:89 => BB:103 probability = 0.16000
#<freq>
# First of two guards in front of the row loop at .Lt_1_199:
# leave for .Lt_1_195 when the value kept in gra_spill_temp_64 is zero.
	ldl	$24,576($sp)              	# [0]  gra_spill_temp_64
#<bpre> branch predict not taken
	beq	$24,.Lt_1_195             	# [4]  
#Block: 90 Pred: 89 Succ: 103 91 
.L_BB90_stencil_core:	# 0xc50
#<loop> Part of loop body line 183, head labeled .Lt_1_180
#<freq>
#<freq> BB:90 frequency = 0.39493 (heuristic)
#<freq> BB:90 => BB:103 probability = 0.25000
#<freq> BB:90 => BB:91 probability = 0.75000
#<freq>
# Second guard: continue only if $11 <= the bound in gra_spill_temp_46
# (cmple leaves 0 in $25 when $11 is greater, and beq then leaves).
	ldl	$25,432($sp)              	# [0]  gra_spill_temp_46
	cmple	$11,$25,$25             	# [4]  
#<bpre> branch predict not taken
	beq	$25,.Lt_1_195             	# [5]  
#Block: 91 Pred: 90 93 Succ: 99 
.Lt_1_308:	# 0xc5c
#<loop> Part of loop body line 183, head labeled .Lt_1_180
#<freq>
#<freq> BB:91 frequency = 0.31726 (heuristic)
#<freq>
# Build the two row pointers used by the loop at .Lt_1_199
# (s4addl a,b,c computes c = 4*a + b; s8addl computes c = 8*a + b):
#   idx = 20*$11 + $13                   (5*$11 first, then 4*that + $13)
#   $20 = gra_spill_temp_81 + 8*(idx + gra_spill_temp_82)
#   $21 = gra_spill_temp_81 + 8*(idx + gra_spill_temp_80)
# The code that follows loads through $20 and stores through $21.
	ldl	$22,704($sp)              	# [0]  gra_spill_temp_80
	s4addl	$11,$11,$21            	# [0]  
	ldl	$20,720($sp)              	# [1]  gra_spill_temp_82
	s4addl	$21,$13,$21            	# [1]  
	addl	$21,$20,$20              	# [5]  
	addl	$21,$22,$21              	# [5]  
	ldl	$22,712($sp)              	# [6]  gra_spill_temp_81
	s8addl	$21,$22,$21            	# [10]  
	s8addl	$20,$22,$20            	# [10]  
#Block: 99 Pred: 102 91 Succ: 234 
.Lt_1_199:	# 0xc80
#<loop> Loop body line 183, nesting depth: 2, estimated iterations: 1
#<freq>
#<freq> BB:99 frequency = 0.31726 (heuristic)
#<freq>
# Start of one row: $17 = 0 is the element counter, and $16 / $8 are working
# copies of the row's load pointer $20 and store pointer $21.  $20 and $21
# themselves are only advanced at the row latch (.L_BB102_stencil_core).
	mov	$31,$17                   	# [0]  
	mov	$20,$16                   	# [0]  
	mov	$21,$8                    	# [1]  
#Block: 234 Pred: 99 Succ: 238 237 
.L_BB234_stencil_core:	# 0xc8c
#<loop> Part of loop body line 183, head labeled .Lt_1_199
#<freq>
#<freq> BB:234 frequency = 0.31726 (heuristic)
#<freq> BB:234 => BB:238 probability = 0.75000
#<freq> BB:234 => BB:237 probability = 0.25000
#<freq>
# Preload the first centre value from 1288($20) and split the trip count:
# $22 = $7 & 3 is the number of elements handled one at a time by the
# remainder blocks below, ahead of the 4x-unrolled loop.  With no remainder,
# go straight to .L_BB237_stencil_core.
# NOTE(review): "mov $23,$19" is presumably a floating-point register copy of
# the value just loaded (it is scheduled on the load's result, and $19 is
# later consumed as an fmad operand) - confirm how this assembler resolves
# mov between the integer and floating-point register files.
	fldd	$23,1288($20)            	# [0]  
	and	$7,3,$22                  	# [0]  
	mov	$23,$19                   	# [4]  
#<bpre> branch predict not taken
	beq	$22,.L_BB237_stencil_core 	# [4]  
#Block: 238 Pred: 234 Succ: 237 239 
.L_BB238_stencil_core:	# 0xc9c
#<loop> Part of loop body line 183, head labeled .Lt_1_199
#<loop> Unrolling remainder loop (at most 3 iterations)
#<freq>
#<freq> BB:238 frequency = 0.23794 (heuristic)
#<freq> BB:238 => BB:237 probability = 0.33333
#<freq> BB:238 => BB:239 probability = 0.66667
#<freq>
# Remainder element 1 of at most 3.  The centre is the value from 1288($20),
# already held in $23; the six inputs summed are at +-1120 (2408, 168),
# +-160 (1448, 1128) and +-8 (1296, 1280) bytes from it.  The result
# fmad(centre, $4, fmuld(sum, $5)) is stored to 1288($21).
# The block also leaves the state expected after one element:
# $17 = 1, $16 = $20 + 8, $8 = $21 + 8, and one fewer remainder element in
# $22.  When $22 reaches zero it leaves for .L_BB237_stencil_core.
	fldd	$8,2408($20)             	# [0]  id:1454 slave+0x0
	subw	$22,1,$22                	# [0]  
	fldd	$3,168($20)              	# [1]  id:1453 slave+0x0
	ldi	$16,8($20)                	# [1]  
	fldd	$2,1128($20)             	# [2]  id:1452 slave+0x0
	addw	$31,1,$17                	# [2]  
	fldd	$1,1448($20)             	# [3]  id:1451 slave+0x0
	faddd	$3,$8,$3                	# [5]  
	fldd	$28,1280($20)            	# [6]  id:1450 slave+0x0
	ldi	$8,8($21)                 	# [6]  
	fldd	$19,1296($20)            	# [7]  id:1449 slave+0x0
	faddd	$2,$3,$2                	# [12]  
	faddd	$1,$2,$1                	# [19]  
	faddd	$28,$1,$28              	# [26]  
	faddd	$19,$28,$28             	# [33]  
	fmuld	$28,$5,$28              	# [40]  
	fmad	$23,$4,$28,$28           	# [47]  
	fstd	$28,1288($21)            	# [57]  id:1455 slave+0x0
#<bpre> branch predict not taken
	beq	$22,.L_BB237_stencil_core 	# [58]  
#Block: 239 Pred: 238 Succ: 237 240 
.L_BB239_stencil_core:	# 0xce8
#<loop> Part of loop body line 183, head labeled .Lt_1_199
#<freq>
#<freq> BB:239 frequency = 0.15863 (heuristic)
#<freq> BB:239 => BB:237 probability = 0.50000
#<freq> BB:239 => BB:240 probability = 0.50000
#<freq>
# Remainder element 2.  Its centre is the value the previous block loaded
# from 1296($20); it is still in $19 and is copied to $24 before $19 is
# reloaded.  The result is stored to 1296($21).
# State after two elements: $17 = 2, $16 = $20 + 16, $8 = $21 + 16.
# $23 = $22 - 1 decides whether a third remainder element is needed.
	fldd	$3,2416($20)             	# [0]  id:1454 slave+0x0
	mov	$19,$24                   	# [0]  
	fldd	$2,176($20)              	# [1]  id:1453 slave+0x0
	subw	$22,1,$23                	# [1]  
	fldd	$1,1136($20)             	# [2]  id:1452 slave+0x0
	ldi	$16,16($20)               	# [2]  
	fldd	$28,1456($20)            	# [3]  id:1451 slave+0x0
	ldi	$8,16($21)                	# [3]  
	fldd	$25,1288($20)            	# [4]  id:1450 slave+0x0
	mov	2,$17                     	# [4]  
	faddd	$2,$3,$2                	# [5]  
	fldd	$19,1304($20)            	# [5]  id:1449 slave+0x0
	faddd	$1,$2,$1                	# [12]  
	faddd	$28,$1,$28              	# [19]  
	faddd	$25,$28,$25             	# [26]  
	faddd	$19,$25,$25             	# [33]  
	fmuld	$25,$5,$25              	# [40]  
	fmad	$24,$4,$25,$24           	# [47]  
	fstd	$24,1296($21)            	# [57]  id:1455 slave+0x0
#<bpre> branch predict unknown
	beq	$23,.L_BB237_stencil_core 	# [58]  
#Block: 240 Pred: 239 Succ: 237 
.L_BB240_stencil_core:	# 0xd38
#<loop> Part of loop body line 183, head labeled .Lt_1_199
#<freq>
#<freq> BB:240 frequency = 0.07931 (heuristic)
#<freq>
# Remainder element 3.  Its centre is the value the previous block loaded
# from 1304($20) (copied from $19 to $8 before $19 is reloaded); the result
# is stored to 1304($21).
# State after three elements: $17 = 3, $16 = $20 + 24, $8 = $21 + 24.
# NOTE(review): $8 and $16 appear here both as floating-point data
# (mov/fmad/fstd operands) and as integer pointers (ldi destinations).  That
# only works if the integer and floating-point register files are separate
# and merely share the "$N" spelling in this listing - confirm for SW3.
	fldd	$24,2424($20)            	# [0]  id:1454 slave+0x0
	mov	$19,$8                    	# [0]  
	fldd	$23,184($20)             	# [1]  id:1453 slave+0x0
	fldd	$22,1144($20)            	# [2]  id:1452 slave+0x0
	faddd	$23,$24,$23             	# [5]  
	fldd	$17,1464($20)            	# [6]  id:1451 slave+0x0
	faddd	$22,$23,$22             	# [12]  
	fldd	$16,1296($20)            	# [13]  id:1450 slave+0x0
	faddd	$17,$22,$17             	# [19]  
	fldd	$19,1312($20)            	# [20]  id:1449 slave+0x0
	faddd	$16,$17,$16             	# [26]  
	mov	3,$17                     	# [27]  
	faddd	$19,$16,$16             	# [33]  
	fmuld	$16,$5,$16              	# [40]  
	fmad	$8,$4,$16,$8             	# [47]  
	ldi	$16,24($20)               	# [47]  
	fstd	$8,1304($21)             	# [57]  id:1455 slave+0x0
	ldi	$8,24($21)                	# [57]  
#Block: 237 Pred: 234 238 239 240 Succ: 242 241 
.L_BB237_stencil_core:	# 0xd80
#<loop> Part of loop body line 183, head labeled .Lt_1_199
#<freq>
#<freq> BB:237 frequency = 0.31726 (heuristic)
#<freq> BB:237 => BB:242 probability = 0.75000
#<freq> BB:237 => BB:241 probability = 0.25000
#<freq>
# Join point after the remainder elements.  $28 = $7 >> 2 is the number of
# full groups of four; if there are none, bypass the 4x-unrolled loop and go
# to .L_BB241_stencil_core (which falls through to the row latch).
	sra	$7,2,$28                  	# [0]  
#<bpre> branch predict not taken
	beq	$28,.L_BB241_stencil_core 	# [1]  
#Block: 242 Pred: 237 Succ: 236 
.L_BB242_stencil_core:	# 0xd88
#<loop> Part of loop body line 183, head labeled .Lt_1_199
#<freq>
#<freq> BB:242 frequency = 0.23794 (heuristic)
#<freq>
#Block: 236 Pred: 236 242 Succ: 236 243 
.L_BB236_stencil_core:	# 0xd88
#<loop> Loop body line 183, nesting depth: 3, estimated iterations: 4
#<loop> unrolled 4 times
#<freq>
#<freq> BB:236 frequency = 0.99143 (heuristic)
#<freq> BB:236 => BB:236 probability = 0.75000
#<freq> BB:236 => BB:243 probability = 0.25000
#<freq>
# Inner loop unrolled by four (see the <loop> note above).  Each trip
# computes four consecutive elements of one row and stores them to
# 1288, 1296, 1304 and 1312($8).  Each element is
#   fmad(centre, $4, fmuld(sum of six inputs, $5))
# with the inputs at +-8, +-160 and +-1120 bytes from the centre.
# Integer state: $17 = element counter (+4 per trip; the loop exits when it
# equals $7), $16 = load pointer and $8 = store pointer (+32 bytes per trip).
# The centre of each element is the "+8" input loaded for the element before
# it ($23, $3, $25 in turn), and $19 - loaded from 1320($16) near the end -
# becomes the first centre of the next trip.  Instruction order and register
# assignment are therefore tightly coupled.
	fldd	$22,2408($16)            	# [0]  id:1454 slave+0x0
	addw	$17,4,$17                	# [0]  
	fldd	$3,168($16)              	# [1]  id:1453 slave+0x0
	fldd	$2,1128($16)             	# [2]  id:1452 slave+0x0
	faddd	$3,$22,$3               	# [5]  
	fldd	$1,1448($16)             	# [6]  id:1451 slave+0x0
	faddd	$2,$3,$2                	# [12]  
	fldd	$25,1280($16)            	# [13]  id:1450 slave+0x0
	faddd	$1,$2,$1                	# [19]  
	fldd	$23,1296($16)            	# [20]  id:1449 slave+0x0
	faddd	$25,$1,$25              	# [26]  
	fldd	$1,2416($16)             	# [27]  id:1454 slave+0x0
	faddd	$23,$25,$25             	# [33]  
	fldd	$24,176($16)             	# [34]  id:1453 slave+0x0
	fmuld	$25,$5,$25              	# [40]  
	fldd	$22,1136($16)            	# [41]  id:1452 slave+0x0
	faddd	$24,$1,$24              	# [44]  
	fldd	$3,1456($16)             	# [45]  id:1451 slave+0x0
	fmad	$19,$4,$25,$19           	# [47]  
	fldd	$1,184($16)              	# [48]  id:1453 slave+0x0
	faddd	$22,$24,$22             	# [51]  
	fldd	$25,192($16)             	# [52]  id:1453 slave+0x0
	faddd	$3,$22,$3               	# [58]  
	fstd	$19,1288($8)             	# [59]  id:1455 slave+0x0
	fldd	$2,1288($16)             	# [60]  id:1450 slave+0x0
	fldd	$19,2424($16)            	# [61]  id:1454 slave+0x0
	faddd	$2,$3,$2                	# [65]  
	fldd	$3,1304($16)             	# [66]  id:1449 slave+0x0
	faddd	$1,$19,$1               	# [69]  
	fldd	$19,2432($16)            	# [70]  id:1454 slave+0x0
	faddd	$3,$2,$2                	# [73]  
	fldd	$24,1144($16)            	# [74]  id:1452 slave+0x0
	faddd	$25,$19,$25             	# [77]  
	fldd	$19,1152($16)            	# [78]  id:1452 slave+0x0
	fmuld	$2,$5,$2                	# [80]  
	faddd	$24,$1,$24              	# [81]  
	fldd	$22,1464($16)            	# [81]  id:1451 slave+0x0
	faddd	$19,$25,$19             	# [84]  
	fldd	$25,1312($16)            	# [84]  id:1449 slave+0x0
	fmad	$23,$4,$2,$23            	# [87]  
	fldd	$2,1472($16)             	# [87]  id:1451 slave+0x0
	faddd	$22,$24,$22             	# [88]  
	cmpeq	$17,$7,$24              	# [88]  
	faddd	$2,$19,$2               	# [91]  
	fstd	$23,1296($8)             	# [97]  id:1455 slave+0x0
	fldd	$19,1296($16)            	# [98]  id:1450 slave+0x0
	faddd	$19,$22,$19             	# [102]  
	faddd	$25,$19,$19             	# [109]  
	fmuld	$19,$5,$19              	# [116]  
	fmad	$3,$4,$19,$3             	# [123]  
	fldd	$19,1320($16)            	# [123]  id:1449 slave+0x0
	fstd	$3,1304($8)              	# [133]  id:1455 slave+0x0
	fldd	$1,1304($16)             	# [134]  id:1450 slave+0x0
	ldi	$16,32($16)               	# [134]  
	faddd	$1,$2,$1                	# [138]  
	faddd	$19,$1,$1               	# [145]  
	fmuld	$1,$5,$1                	# [152]  
	fmad	$25,$4,$1,$25            	# [159]  
	fstd	$25,1312($8)             	# [169]  id:1455 slave+0x0
	ldi	$8,32($8)                 	# [169]  
#<bpre> branch predict taken
	beq	$24,.L_BB236_stencil_core 	# [170]  
#Block: 243 Pred: 236 Succ: 241 
.L_BB243_stencil_core:	# 0xe7c
#<loop> Part of loop body line 183, head labeled .Lt_1_199
#<freq>
#<freq> BB:243 frequency = 0.24786 (heuristic)
#<freq>
#Block: 241 Pred: 237 243 Succ: 235 
.L_BB241_stencil_core:	# 0xe7c
#<loop> Part of loop body line 183, head labeled .Lt_1_199
#<freq>
#<freq> BB:241 frequency = 0.00000 (heuristic)
#<freq>
#Block: 235 Pred: 241 Succ: 102 
.L_BB235_stencil_core:	# 0xe7c
#<loop> Part of loop body line 183, head labeled .Lt_1_199
#<freq>
#<freq> BB:235 frequency = 0.31726 (heuristic)
#<freq>
#Block: 102 Pred: 235 Succ: 103 99 
.L_BB102_stencil_core:	# 0xe7c
#<loop> Part of loop body line 183, head labeled .Lt_1_199
#<freq>
#<freq> BB:102 frequency = 0.31726 (heuristic)
#<freq> BB:102 => BB:103 probability = 1.00000
#<freq> BB:102 => BB:99 probability = 0.00000
#<freq>
# Row latch of the loop headed by .Lt_1_199 (the empty blocks above fall
# through to here).  Move to the next row: $11 += 1 and both row pointers
# $20 (loads) and $21 (stores) advance by 160 bytes.  The loop repeats until
# $11 equals $6.  The branch target .Lt_1_199.bpre is defined outside this
# section of the file.
	addw	$11,1,$11                	# [0]  
	ldi	$20,160($20)              	# [0]  
	cmpeq	$11,$6,$23              	# [1]  
	ldi	$21,160($21)              	# [1]  
#<bpre> branch predict not taken
	beq	$23,.Lt_1_199.bpre        	# [2]  
#Block: 103 Pred: 102 89 90 92 319 Succ: 104 81 
.Lt_1_195:	# 0xe90
.Lt_1_193:	# 0xe90
#<loop> Part of loop body line 183, head labeled .Lt_1_180
#<freq>
#<freq> BB:103 frequency = 0.50000 (heuristic)
#<freq> BB:103 => BB:104 probability = 1.00000
#<freq> BB:103 => BB:81 probability = 0.00000
#<freq>
# Latch of the loop headed by .Lt_1_180: $18 += 1, $26 and $15 advance by
# 1120, and $13 by 140.  $13 is used as an element index that gets scaled by
# 8 at .Lt_1_308, so its step matches the others (140 * 8 = 1120 bytes).
# The loop repeats until $18 equals $12.  .Lt_1_180.bpre is defined outside
# this section of the file.
	addw	$18,1,$18                	# [1]  
	ldi	$26,1120($26)             	# [1]  
	cmpeq	$18,$12,$24             	# [2]  
	ldi	$15,1120($15)             	# [2]  
	ldi	$13,140($13)              	# [3]  
#<bpre> branch predict not taken
	beq	$24,.Lt_1_180.bpre        	# [3]  
#Block: 104 Pred: 103 Succ: 106 78 
.L_BB104_stencil_core:	# 0xea8
#<freq>
#<freq> BB:104 frequency = 0.50000 (heuristic)
#<freq> BB:104 => BB:106 probability = 0.07201
#<freq> BB:104 => BB:78 probability = 0.92799
#<freq>
# Two-way exit: reload gra_spill_temp_64; a non-zero value continues at
# .Lt_1_309, zero falls through to .Lt_1_323 below.
# The bne does not target .Lt_1_309 directly.  Control first jumps over a
# one-instruction trampoline, then the bne branches backwards to that
# trampoline, which in turn jumps to .Lt_1_309.
# NOTE(review): presumably emitted so that the predicted-taken conditional
# branch is a backward one - confirm against the compiler's branch-prediction
# scheme before simplifying.
	ldl	$25,576($sp)              	# [0]  gra_spill_temp_64
#<bpre> branch predict taken
	br .L_BB104_stencil_core.bpre1
.Lt_1_309.bpre.L_BB104_stencil_core:
	br .Lt_1_309
.L_BB104_stencil_core.bpre1:
	bne	$25,.Lt_1_309.bpre.L_BB104_stencil_core 	# [4]  
#Block: 106 Pred: 76 104 Succ: 110 
.Lt_1_323:	# 0xeb0
.Lt_1_207:	# 0xeb0
#<freq>
#<freq> BB:106 frequency = 0.11601 (heuristic)
#<freq>
# Path that bypasses the loop at .Lt_1_210 and joins at .Lt_1_206.  It fills
# the same three spill slots that the loop's setup code writes
# (s4addl a,b,c gives c = 4*a + b; s8subl a,b,c gives c = 8*a - b):
#   gra_spill_temp_62 = 140 * $14                 (x4, then x7, then x5)
#   gra_spill_temp_11 =  20 * $14                 (x5, then x4)
#   gra_spill_temp_9  =  20 * gra_spill_temp_63   (x5, then x4)
	ldl	$27,568($sp)              	# [0]  gra_spill_temp_63
	sll	$14,2,$1                  	# [0]  
	s8subl	$1,$1,$1               	# [1]  
	s4addl	$14,$14,$28            	# [1]  
	s4addl	$28,$31,$28            	# [2]  
	s4addl	$1,$1,$1               	# [2]  
	stl	$1,560($sp)               	# [3]  gra_spill_temp_62
	s4addl	$27,$27,$27            	# [4]  
	s4addl	$27,$31,$27            	# [5]  
	stl	$28,152($sp)              	# [5]  gra_spill_temp_11
	stl	$27,136($sp)              	# [6]  gra_spill_temp_9
	br	$31,.Lt_1_206              	# [7]  
#Block: 74 Pred: 69 Succ: 76 
.Lt_1_321:	# 0xee0
#<freq>
#<freq> BB:74 frequency = 0.37500 (heuristic)
#<freq>
# gra_spill_temp_61 = (3 <= $14), a 0/1 flag.  It is tested later at
# .Lt_1_216 and .Lt_1_310 to decide whether their loops run.
	mov	3,$28                     	# [0]  
	cmple	$28,$14,$28             	# [1]  
	stl	$28,552($sp)              	# [2]  gra_spill_temp_61
#Block: 76 Pred: 74 75 Succ: 77 106 
.Lt_1_177:	# 0xeec
#<freq>
#<freq> BB:76 frequency = 0.50000 (heuristic)
#<freq> BB:76 => BB:77 probability = 0.84000
#<freq> BB:76 => BB:106 probability = 0.16000
#<freq>
# When gra_spill_temp_64 is zero, leave for .Lt_1_323.bpre (a label defined
# outside this section of the file); otherwise fall through.
	ldl	$1,576($sp)               	# [0]  gra_spill_temp_64
#<bpre> branch predict not taken
	beq	$1,.Lt_1_323.bpre         	# [4]  
#Block: 77 Pred: 76 Succ: 78 
.L_BB77_stencil_core:	# 0xef4
#<freq>
#<freq> BB:77 frequency = 0.42000 (heuristic)
#<freq>
# $7 = gra_spill_temp_75 - 3 (32-bit subtract).  $7 is the value the loop at
# .Lt_1_210 compares its trip counter against.
	ldl	$7,664($sp)               	# [0]  gra_spill_temp_75
	subw	$7,3,$7                  	# [4]  
#Block: 78 Pred: 77 104 Succ: 244 
.Lt_1_309:	# 0xefc
#<freq>
#<freq> BB:78 frequency = 0.88399 (heuristic)
#<freq>
# Pointer setup for the loop at .Lt_1_210.  Writing
#   P = 140 * $14  (also saved to gra_spill_temp_62)
#   Q =  20 * gra_spill_temp_63
#   R =  20 * $14
#   L = gra_spill_temp_80,  S = gra_spill_temp_82,  B = gra_spill_temp_81
# the registers end up as:
#   $6  = B + 8*S              $12 = B + 8*L
#   $27 = B + 8*(P + S)        $25 = B + 8*(P + L)
#   $24 = B + 8*(Q + S)        $23 = B + 8*(Q + L)
#   $22 = B + 8*(P + Q + S)    $20 = B + 8*(P + Q + L)
#   $17 = gra_spill_temp_65    $11 = gra_spill_temp_65 + 8*R
#   $13 = gra_spill_temp_66    $21 = gra_spill_temp_66 + 8*R
#   $19 = gra_spill_temp_67    $9  = gra_spill_temp_67 + 8*Q
#   $8  = gra_spill_temp_68    $28 = gra_spill_temp_68 + 8*Q
#   $15 = Q,  $26 = R,  $16 = 0 (trip counter)
# In the loop, $6/$27/$24/$22 are load bases and $12/$25/$23/$20 are the
# corresponding store bases.  The loop's id: annotations tie the
# gra_spill_temp_65..68 pointers to A_ls, A_rs, A_us and A_ds respectively.
# The interleaving matters: $6 and $12 are used as plain offsets (S, L) by
# the addl/s4addl instructions before they are turned into pointers.
	ldl	$23,568($sp)              	# [0]  gra_spill_temp_63
	sll	$14,2,$25                 	# [0]  
	ldl	$12,704($sp)              	# [1]  gra_spill_temp_80
	s8subl	$25,$25,$25            	# [1]  
	ldl	$6,720($sp)               	# [2]  gra_spill_temp_82
	s4addl	$25,$25,$25            	# [2]  
	ldl	$13,592($sp)              	# [3]  gra_spill_temp_66
	s4addl	$14,$14,$26            	# [3]  
	ldl	$17,584($sp)              	# [4]  gra_spill_temp_65
	s4addl	$23,$23,$23            	# [4]  
	ldl	$8,608($sp)               	# [5]  gra_spill_temp_68
	s4addl	$23,$25,$20            	# [5]  
	ldl	$19,600($sp)              	# [6]  gra_spill_temp_67
	addl	$20,$6,$22               	# [6]  
	ldl	$16,712($sp)              	# [7]  gra_spill_temp_81
	addl	$20,$12,$20              	# [7]  
	s4addl	$23,$31,$15            	# [8]  
	s4addl	$23,$6,$24             	# [8]  
	s4addl	$23,$12,$23            	# [9]  
	s4addl	$26,$31,$26            	# [9]  
	stl	$25,560($sp)              	# [10]  gra_spill_temp_62
	addl	$25,$6,$27               	# [10]  
	addl	$25,$12,$25              	# [11]  
	s8addl	$12,$16,$12            	# [11]  
	s8addl	$25,$16,$25            	# [12]  
	s8addl	$27,$16,$27            	# [12]  
	s8addl	$6,$16,$6              	# [13]  
	s8addl	$26,$17,$11            	# [13]  
	s8addl	$26,$13,$21            	# [14]  
	s8addl	$23,$16,$23            	# [14]  
	s8addl	$24,$16,$24            	# [15]  
	s8addl	$15,$19,$9             	# [15]  
	s8addl	$15,$8,$28             	# [16]  
	s8addl	$20,$16,$20            	# [16]  
	s8addl	$22,$16,$22            	# [17]  
	mov	$31,$16                   	# [17]  
#Block: 244 Pred: 78 Succ: 109 
.L_BB244_stencil_core:	# 0xf8c
#<freq>
#<freq> BB:244 frequency = 0.88399 (heuristic)
#<freq>
	.loc	1	192	0
# 188    //7.1 compute up and down line of k dimensional change
# 189    for(k = 1; k < k_region; ++k)
# 190    {
# 191      //left face
# 192      slave[lhs_no][0][0][k] = alpha_d * slave[rhs_no][0][0][k] + \
# Loop preheader.  Preload from 8($6) the value the first trip of .Lt_1_210
# uses as its centre for source line 192, and save $15 and $26 (holding
# 20*gra_spill_temp_63 and 20*$14 from the setup block) to gra_spill_temp_9
# and gra_spill_temp_11.
	fldd	$10,8($6)                	# [0]  
	stl	$15,136($sp)              	# [1]  gra_spill_temp_9
	stl	$26,152($sp)              	# [2]  gra_spill_temp_11
#Block: 109 Pred: 109 244 Succ: 245 109 
	.align	4
.Lt_1_210:	# 0xf98
#<loop> Loop body line 183, nesting depth: 1, estimated iterations: 18
#<freq>
#<freq> BB:109 frequency = 15.91188 (heuristic)
#<freq> BB:109 => BB:245 probability = 0.05556
#<freq> BB:109 => BB:109 probability = 0.94444
#<freq>
# One trip handles one index k and performs the four updates attributed to
# source lines 192, 196, 201 and 205 by the .loc markers.  Each one is
#   fmad(centre, $4, fmuld(sum of six inputs, $5))
# where the six inputs mix slave values with one or two values from the
# A_us / A_ls / A_ds / A_rs arrays (see the id: annotations on the loads).
# NOTE(review): $4 = alpha_d and $5 = beta_d is inferred from the source form
# "alpha_d * centre + beta_d * (...)" - confirm where $4/$5 are loaded.
# Stores: 8($12) for line 192, -1112($25) for 196, -152($23) for 201 and
# -1272($20) for 205.
# Every pointer register used here advances by 8 bytes per trip.  $16 is the
# trip counter; the loop ends when it equals $7.
# The centre for line 192 is carried in a register: "mov $10,$15" picks up
# the value loaded from 16($6) on the previous trip (or the preheader load).
	fldd	$3,1128($6)              	# [0]  id:1462 slave+0x0
	mov	$10,$15                   	# [0]  
	fldd	$2,8($19)                	# [1]  id:1461 A_us+0x0
	.loc	1	205	0
# 201      slave[lhs_no][0][j_region][k] = alpha_d * slave[rhs_no][0][j_region][k]+ \
# 202                       beta_d * (A_us[j_region][k] + slave[rhs_no][1][j_region][k] +\
# 203                       slave[rhs_no][0][j_j][k] + A_rs[0][k]+\
# 204                       slave[rhs_no][0][j_region][k-1] + slave[rhs_no][0][j_region][k+1]);
# 205      slave[lhs_no][i_region][j_region][k] = alpha_d * slave[rhs_no][i_region][j_region][k] + \
	addw	$16,1,$16                	# [1]  
	.loc	1	192	0
	fldd	$1,8($17)                	# [2]  id:1460 A_ls+0x0
	.loc	1	205	0
	ldi	$17,8($17)                	# [2]  
	.loc	1	192	0
	fldd	$26,168($6)              	# [3]  id:1459 slave+0x0
	.loc	1	205	0
	ldi	$19,8($19)                	# [3]  
	.loc	1	192	0
	fldd	$18,0($6)                	# [4]  id:1458 slave+0x0
	faddd	$2,$3,$2                	# [5]  
	fldd	$10,16($6)               	# [6]  id:1457 slave+0x0
	.loc	1	205	0
	ldi	$6,8($6)                  	# [6]  
	.loc	1	196	0
	fldd	$3,8($8)                 	# [7]  id:1470 A_ds+0x0
	.loc	1	205	0
	ldi	$8,8($8)                  	# [7]  
	.loc	1	192	0
	faddd	$1,$2,$1                	# [12]  
	faddd	$26,$1,$26              	# [19]  
	.loc	1	196	0
	fldd	$1,-152($11)             	# [19]  id:1468 A_ls+0x0
	.loc	1	205	0
	ldi	$11,8($11)                	# [20]  
	.loc	1	192	0
	faddd	$18,$26,$18             	# [26]  
	.loc	1	196	0
	fldd	$26,-952($27)            	# [27]  id:1467 slave+0x0
	.loc	1	192	0
	faddd	$10,$18,$18             	# [33]  
	fmuld	$18,$5,$18              	# [40]  
	fmad	$15,$4,$18,$15           	# [47]  
	.loc	1	196	0
	fldd	$18,-1120($27)           	# [47]  id:1466 slave+0x0
	.loc	1	192	0
	fstd	$15,8($12)               	# [57]  id:1463 slave+0x0
	.loc	1	205	0
	ldi	$12,8($12)                	# [57]  
	.loc	1	196	0
	fldd	$2,-2232($27)            	# [58]  id:1469 slave+0x0
	fldd	$15,-1104($27)           	# [59]  id:1465 slave+0x0
	faddd	$2,$3,$2                	# [62]  
	fldd	$3,-1112($27)            	# [63]  id:1464 slave+0x0
	.loc	1	205	0
	ldi	$27,8($27)                	# [63]  
	.loc	1	196	0
	faddd	$1,$2,$1                	# [69]  
	faddd	$26,$1,$26              	# [76]  
	.loc	1	201	0
	fldd	$1,-152($9)              	# [76]  id:1477 A_us+0x0
	.loc	1	205	0
	ldi	$9,8($9)                  	# [77]  
	.loc	1	196	0
	faddd	$18,$26,$18             	# [83]  
	faddd	$15,$18,$15             	# [90]  
	.loc	1	201	0
	fldd	$18,8($13)               	# [90]  id:1475 A_rs+0x0
	.loc	1	205	0
	ldi	$13,8($13)                	# [91]  
	.loc	1	196	0
	fmuld	$15,$5,$15              	# [97]  
	fmad	$3,$4,$15,$3             	# [104]  
	.loc	1	201	0
	fldd	$15,-160($24)            	# [104]  id:1474 slave+0x0
	.loc	1	196	0
	fstd	$3,-1112($25)            	# [114]  id:1471 slave+0x0
	.loc	1	205	0
	ldi	$25,8($25)                	# [114]  
	.loc	1	201	0
	fldd	$2,968($24)              	# [115]  id:1478 slave+0x0
	fldd	$26,-312($24)            	# [116]  id:1476 slave+0x0
	faddd	$1,$2,$1                	# [119]  
	fldd	$3,-144($24)             	# [120]  id:1473 slave+0x0
	faddd	$26,$1,$26              	# [126]  
	fldd	$2,-152($24)             	# [127]  id:1472 slave+0x0
	.loc	1	205	0
	ldi	$24,8($24)                	# [127]  
	fldd	$1,-152($28)             	# [128]  id:1486 A_ds+0x0
	ldi	$28,8($28)                	# [128]  
	.loc	1	201	0
	faddd	$18,$26,$18             	# [133]  
	faddd	$15,$18,$15             	# [140]  
	.loc	1	205	0
	fldd	$18,-1432($22)           	# [140]  id:1484 slave+0x0
	.loc	1	201	0
	faddd	$3,$15,$3               	# [147]  
	.loc	1	205	0
	fldd	$15,-152($21)            	# [147]  id:1483 A_rs+0x0
	ldi	$21,8($21)                	# [148]  
	.loc	1	201	0
	fmuld	$3,$5,$3                	# [154]  
	fmad	$2,$4,$3,$2              	# [161]  
	.loc	1	205	0
	fldd	$3,-1280($22)            	# [161]  id:1482 slave+0x0
	.loc	1	201	0
	fstd	$2,-152($23)             	# [171]  id:1479 slave+0x0
	.loc	1	205	0
	ldi	$23,8($23)                	# [171]  
	fldd	$26,-2392($22)           	# [172]  id:1485 slave+0x0
	fldd	$2,-1264($22)            	# [173]  id:1481 slave+0x0
	faddd	$26,$1,$26              	# [176]  
	fldd	$1,-1272($22)            	# [177]  id:1480 slave+0x0
	ldi	$22,8($22)                	# [177]  
	faddd	$18,$26,$18             	# [183]  
	cmpeq	$16,$7,$26              	# [183]  
	faddd	$15,$18,$15             	# [190]  
	faddd	$3,$15,$3               	# [197]  
	faddd	$2,$3,$2                	# [204]  
	fmuld	$2,$5,$2                	# [211]  
	fmad	$1,$4,$2,$1              	# [218]  
	fstd	$1,-1272($20)            	# [228]  id:1487 slave+0x0
	ldi	$20,8($20)                	# [228]  
#<bpre> branch predict taken
	beq	$26,.Lt_1_210             	# [229]  
#Block: 245 Pred: 109 Succ: 110 
.L_BB245_stencil_core:	# 0x10d4
#<freq>
#<freq> BB:245 frequency = 0.88399 (heuristic)
#<freq>
#Block: 110 Pred: 106 245 Succ: 111 121 
.Lt_1_206:	# 0x10d4
#<freq>
#<freq> BB:110 frequency = 1.00000 (heuristic)
#<freq> BB:110 => BB:111 probability = 0.75000
#<freq> BB:110 => BB:121 probability = 0.25000
#<freq>
# Join point after the loop at .Lt_1_210 (or its bypass).
# $6 = (6 <= gra_spill_temp_75); the 0/1 result is also saved in
# gra_spill_temp_40.  When it is 0, skip to .Lt_1_213 (outside this section
# of the file); otherwise fall through into the setup for .Lt_1_216.
	ldl	$7,664($sp)               	# [0]  gra_spill_temp_75
	mov	6,$6                      	# [0]  
	cmple	$6,$7,$6                	# [4]  
	stl	$6,384($sp)               	# [5]  gra_spill_temp_40
#<bpre> branch predict not taken
	beq	$6,.Lt_1_213              	# [6]  
#Block: 111 Pred: 110 Succ: 113 
.L_BB111_stencil_core:	# 0x10e8
#<freq>
#<freq> BB:111 frequency = 0.75000 (heuristic)
#<freq>
# One-time setup for the loop headed by .Lt_1_216.  With
# N = gra_spill_temp_75:
#   gra_spill_temp_76 = 0        loop counter, stepped by 3 at .Lt_1_217
#   gra_spill_temp_72 = N - 6    bound tested at .Lt_1_217
#   gra_spill_temp_74 = gra_spill_temp_82
#   gra_spill_temp_73 = gra_spill_temp_9
#   $12               = $14 - 2  value the loop at .Lt_1_221 counts up to
#   gra_spill_temp_5  = result of the sequence described below
# The ldi/ldih pair builds a constant in $18 whose low 32 bits are
# 0xAAAAAAAB.  The code then forms |N - 3| with selge, multiplies it by that
# constant (umulw), shifts right by 33, and uses a second selge on the sign
# of N - 3 to choose between the quotient and its negation.
# NOTE(review): this is the usual reciprocal-multiply form of a signed
# division by 3, i.e. gra_spill_temp_5 = (N - 3) / 3 truncated toward zero;
# the exact umulw and selge operand semantics should be checked against the
# SW3 ISA manual.
	ldl	$17,664($sp)              	# [0]  gra_spill_temp_75
	ldi	$18,-21845($31)           	# [0]  
	ldih	$18,-21845($18)          	# [1]  
	ldl	$19,720($sp)              	# [1]  gra_spill_temp_82
	stl	$31,672($sp)              	# [2]  gra_spill_temp_76
	subw	$14,2,$12                	# [2]  
	subw	$17,3,$8                 	# [4]  
	subw	$17,6,$17                	# [4]  
	subw	$31,$8,$16               	# [5]  
	stl	$17,640($sp)              	# [5]  gra_spill_temp_72
	selge	$8,$8,$16,$16           	# [6]  
	stl	$19,656($sp)              	# [6]  gra_spill_temp_74
	umulw	$16,$18,$16             	# [7]  
	ldl	$18,136($sp)              	# [7]  gra_spill_temp_9
	stl	$18,648($sp)              	# [11]  gra_spill_temp_73
	srl	$16,33,$16                	# [12]  
	subw	$31,$16,$17              	# [13]  
	selge	$8,$16,$17,$8           	# [14]  
	stl	$8,104($sp)               	# [15]  gra_spill_temp_5
#Block: 113 Pred: 117 111 Succ: 114 117 
	.align	4
.Lt_1_216:	# 0x1134
#<loop> Loop body line 205, nesting depth: 1, estimated iterations: 5
#<freq>
#<freq> BB:113 frequency = 3.75000 (heuristic)
#<freq> BB:113 => BB:114 probability = 0.92799
#<freq> BB:113 => BB:117 probability = 0.07201
#<freq>
# Loop head.  Skip this step's inner loop and go directly to the latch
# .Lt_1_217 when the flag in gra_spill_temp_61 is zero (the flag is written
# as "3 <= $14" at .Lt_1_321).
	ldl	$19,552($sp)              	# [0]  gra_spill_temp_61
#<bpre> branch predict not taken
	beq	$19,.Lt_1_217             	# [4]  
#Block: 114 Pred: 113 Succ: 246 
.L_BB114_stencil_core:	# 0x113c
#<loop> Part of loop body line 205, head labeled .Lt_1_216
#<freq>
#<freq> BB:114 frequency = 3.47995 (heuristic)
#<freq>
# Pointer setup for the loop at .Lt_1_221.  With B = gra_spill_temp_81,
# L = gra_spill_temp_80, S = gra_spill_temp_82, c = gra_spill_temp_76,
# t73 = gra_spill_temp_73 and t74 = gra_spill_temp_74:
#   $7  = B + 8*t74            load base for source line 214
#   $19 = B + 8*(c + L)        store base for source line 214
#   $6  = B + 8*(t73 + S)      load base for source line 218
#   $17 = B + 8*(t73 + L)      store base for source line 218
#   $10 = gra_spill_temp_65 + 8*c   (A_ls per the loop's id: annotations)
#   $24 = gra_spill_temp_66 + 8*c   (A_rs per the loop's id: annotations)
#   $16 = 0                    trip counter
# $10 holds c only until "s8addl $10,$16,$10" turns it into the A_ls pointer,
# so the two s8addl instructions that read c must stay in this order.
	ldl	$7,720($sp)               	# [0]  gra_spill_temp_82
	ldl	$19,704($sp)              	# [1]  gra_spill_temp_80
	ldl	$6,648($sp)               	# [2]  gra_spill_temp_73
	ldl	$10,672($sp)              	# [3]  gra_spill_temp_76
	addl	$6,$19,$17               	# [6]  
	addl	$6,$7,$6                 	# [7]  
	ldl	$7,656($sp)               	# [7]  gra_spill_temp_74
	ldl	$16,584($sp)              	# [8]  gra_spill_temp_65
	addl	$10,$19,$19              	# [10]  
	ldl	$24,592($sp)              	# [11]  gra_spill_temp_66
	ldl	$8,712($sp)               	# [12]  gra_spill_temp_81
	s8addl	$10,$24,$24            	# [15]  
	s8addl	$10,$16,$10            	# [16]  
	mov	$31,$16                   	# [16]  
	s8addl	$6,$8,$6               	# [19]  
	s8addl	$19,$8,$19             	# [19]  
	s8addl	$17,$8,$17             	# [20]  
	s8addl	$7,$8,$7               	# [20]  
#Block: 246 Pred: 114 Succ: 116 
.L_BB246_stencil_core:	# 0x1184
#<loop> Part of loop body line 205, head labeled .Lt_1_216
#<freq>
#<freq> BB:246 frequency = 3.47995 (heuristic)
#<freq>
	.loc	1	218	0
# 214         slave[lhs_no][i][0][k] = alpha_d * slave[rhs_no][i][0][k] + \
# 215                       beta_d * (slave[rhs_no][i-1][0][k] + slave[rhs_no][i+1][0][k] +\
# 216                       A_ls[i][k] + slave[rhs_no][i][1][k]+\
# 217                       slave[rhs_no][i][0][k-1] + slave[rhs_no][i][0][k+1]);
# 218         slave[lhs_no][i][j_region][k] = alpha_d * slave[rhs_no][i][j_region][k] + \
# Loop preheader: preload the nine values that the first trip of .Lt_1_221
# expects to find in registers - four via the line-218 load base $6 and five
# via the line-214 load base $7.  Inside the loop the same registers are
# refilled by loads placed late in the body for the following trip.
	fldd	$23,-144($6)             	# [0]  
	fldd	$22,984($6)              	# [1]  
	.loc	1	214	0
	fldd	$25,16($7)               	# [2]  
	fldd	$20,1144($7)             	# [3]  
	.loc	1	218	0
	fldd	$28,-152($6)             	# [4]  
	fldd	$27,976($6)              	# [5]  
	.loc	1	214	0
	fldd	$8,1128($7)              	# [6]  
	fldd	$21,8($7)                	# [7]  
	fldd	$9,1136($7)              	# [8]  
#Block: 116 Pred: 116 246 Succ: 247 116 
.Lt_1_221:	# 0x11a8
#<loop> Loop body line 205, nesting depth: 2, estimated iterations: 5
#<freq>
#<freq> BB:116 frequency = 17.39975 (heuristic)
#<freq> BB:116 => BB:247 probability = 0.20000
#<freq> BB:116 => BB:116 probability = 0.80000
#<freq>
# Per trip, the four slave pointers ($7, $19, $6, $17) advance by 1120 bytes
# and the A_ls / A_rs pointers ($10, $24) by 160 bytes.  Each trip updates
# three consecutive 8-byte elements for each of two source statements:
#   source line 214 -> stores to 1128, 1136 and 1144($19)
#   source line 218 -> stores to  968,  976 and  984($17)
# Every result is fmad(centre, $4, fmuld(sum of six inputs, $5)).
# $16 counts trips; the loop ends when it equals $12.
# Values are carried between trips in registers: the "mov" copies at the top
# and in the middle of the body pick up data that was loaded on the previous
# trip (or by the preheader), and the loads that refill those registers sit
# later in the body.  Instruction order and register assignment are
# therefore tightly coupled.
	mov	$8,$3                     	# [0]  
	fldd	$8,2248($7)              	# [0]  id:1494 slave+0x0
	fldd	$15,168($10)             	# [1]  id:1492 A_ls+0x0
	.loc	1	218	0
	addw	$16,1,$16                	# [1]  
	.loc	1	214	0
	fldd	$13,1288($7)             	# [2]  id:1491 slave+0x0
	faddd	$21,$8,$18              	# [4]  
	fldd	$11,1120($7)             	# [5]  id:1490 slave+0x0
	faddd	$15,$18,$15             	# [11]  
	.loc	1	218	0
	fldd	$2,2088($6)              	# [12]  id:1502 slave+0x0
	.loc	1	214	0
	faddd	$13,$15,$13             	# [18]  
	.loc	1	218	0
	fldd	$26,960($6)              	# [19]  id:1498 slave+0x0
	faddd	$28,$2,$2               	# [22]  
	fldd	$28,168($24)             	# [23]  id:1499 A_rs+0x0
	.loc	1	214	0
	faddd	$11,$13,$11             	# [25]  
	fldd	$18,176($10)             	# [26]  id:1508 A_ls+0x0
	faddd	$9,$11,$11              	# [32]  
	fldd	$13,1296($7)             	# [33]  id:1507 slave+0x0
	fmuld	$11,$5,$11              	# [39]  
	fmad	$3,$4,$11,$3             	# [46]  
	mov	$9,$11                    	# [46]  
	fldd	$9,2256($7)              	# [47]  id:1510 slave+0x0
	faddd	$25,$9,$21              	# [51]  
	fldd	$25,184($10)             	# [51]  id:1524 A_ls+0x0
	.loc	1	218	0
	ldi	$10,160($10)              	# [52]  
	.loc	1	214	0
	fstd	$3,1128($19)             	# [56]  id:1495 slave+0x0
	.loc	1	218	0
	fldd	$1,808($6)               	# [57]  id:1500 slave+0x0
	.loc	1	214	0
	faddd	$18,$21,$18             	# [58]  
	.loc	1	218	0
	fldd	$15,968($6)              	# [59]  id:1496 slave+0x0
	faddd	$1,$2,$1                	# [62]  
	.loc	1	214	0
	faddd	$13,$18,$13             	# [65]  
	fldd	$18,1152($7)             	# [65]  id:1521 slave+0x0
	.loc	1	218	0
	faddd	$28,$1,$28              	# [69]  
	fldd	$1,176($24)              	# [69]  id:1515 A_rs+0x0
	faddd	$26,$28,$26             	# [76]  
	faddd	$27,$26,$26             	# [83]  
	fldd	$27,2096($6)             	# [83]  id:1518 slave+0x0
	faddd	$23,$27,$3              	# [87]  
	fmuld	$26,$5,$26              	# [90]  
	fmad	$15,$4,$26,$15           	# [97]  
	.loc	1	214	0
	fldd	$26,24($7)               	# [97]  id:1525 slave+0x0
	.loc	1	218	0
	fstd	$15,968($17)             	# [107]  id:1503 slave+0x0
	mov	$20,$15                   	# [107]  
	.loc	1	214	0
	fldd	$21,1128($7)             	# [108]  id:1506 slave+0x0
	.loc	1	218	0
	fldd	$28,968($6)              	# [109]  id:1514 slave+0x0
	.loc	1	214	0
	faddd	$21,$13,$13             	# [112]  
	faddd	$20,$13,$13             	# [119]  
	fldd	$20,2264($7)             	# [119]  id:1526 slave+0x0
	faddd	$26,$20,$26             	# [123]  
	fmuld	$13,$5,$13              	# [126]  
	faddd	$25,$26,$25             	# [130]  
	.loc	1	218	0
	cmpeq	$16,$12,$26             	# [130]  
	.loc	1	214	0
	fmad	$11,$4,$13,$11           	# [133]  
	.loc	1	218	0
	fldd	$13,-136($6)             	# [133]  id:1533 slave+0x0
	.loc	1	214	0
	fstd	$11,1136($19)            	# [143]  id:1511 slave+0x0
	.loc	1	218	0
	fldd	$2,816($6)               	# [144]  id:1516 slave+0x0
	fldd	$23,976($6)              	# [145]  id:1512 slave+0x0
	faddd	$2,$3,$2                	# [148]  
	fldd	$3,184($24)              	# [149]  id:1531 A_rs+0x0
	ldi	$24,160($24)              	# [149]  
	faddd	$1,$2,$1                	# [155]  
	fldd	$2,992($6)               	# [155]  id:1529 slave+0x0
	faddd	$28,$1,$1               	# [162]  
	faddd	$22,$1,$1               	# [169]  
	.loc	1	214	0
	fldd	$22,1304($7)             	# [169]  id:1523 slave+0x0
	faddd	$22,$25,$22             	# [173]  
	.loc	1	218	0
	fmuld	$1,$5,$1                	# [176]  
	fmad	$23,$4,$1,$23            	# [183]  
	fstd	$23,976($17)             	# [193]  id:1519 slave+0x0
	.loc	1	214	0
	fldd	$25,1136($7)             	# [194]  id:1522 slave+0x0
	.loc	1	218	0
	ldi	$7,1120($7)               	# [194]  
	fldd	$23,976($6)              	# [195]  id:1530 slave+0x0
	.loc	1	214	0
	faddd	$25,$22,$22             	# [198]  
	faddd	$18,$22,$18             	# [205]  
	.loc	1	218	0
	fldd	$22,2104($6)             	# [205]  id:1534 slave+0x0
	faddd	$13,$22,$13             	# [209]  
	.loc	1	214	0
	fmuld	$18,$5,$18              	# [212]  
	fmad	$15,$4,$18,$15           	# [219]  
	fstd	$15,1144($19)            	# [229]  id:1527 slave+0x0
	.loc	1	218	0
	ldi	$19,1120($19)             	# [229]  
	fldd	$11,824($6)              	# [230]  id:1532 slave+0x0
	fldd	$1,984($6)               	# [231]  id:1528 slave+0x0
	ldi	$6,1120($6)               	# [231]  
	faddd	$11,$13,$11             	# [234]  
	faddd	$3,$11,$3               	# [241]  
	faddd	$23,$3,$3               	# [248]  
	faddd	$2,$3,$2                	# [255]  
	fmuld	$2,$5,$2                	# [262]  
	fmad	$1,$4,$2,$1              	# [269]  
	fstd	$1,984($17)              	# [279]  id:1535 slave+0x0
	ldi	$17,1120($17)             	# [279]  
#<bpre> branch predict taken
	beq	$26,.Lt_1_221             	# [280]  
#Block: 247 Pred: 116 Succ: 117 
#<doc> BB247 holds no instructions; it falls straight through into BB117.
.L_BB247_stencil_core:	# 0x1314
#<loop> Part of loop body line 205, head labeled .Lt_1_216
#<freq>
#<freq> BB:247 frequency = 3.47995 (heuristic)
#<freq>
#Block: 117 Pred: 247 113 Succ: 118 113 
#<doc> Latch of the loop headed at .Lt_1_216. All three induction values live
#<doc> in stack spill slots, so each is reloaded, bumped by 3 and written back:
#<doc>   gra_spill_temp_76 (672($sp)) += 3   -- also the value that is compared
#<doc>   gra_spill_temp_74 (656($sp)) += 3
#<doc>   gra_spill_temp_73 (648($sp)) += 3
#<doc> The loop is re-entered while the updated temp_76 <= gra_spill_temp_72.
#<doc> (Reading assumes Alpha-style operand order `op src1,src2,dst` -- confirm
#<doc> against the SW ISA manual.)
.Lt_1_217:	# 0x1314
#<loop> Part of loop body line 205, head labeled .Lt_1_216
#<freq>
#<freq> BB:117 frequency = 3.75000 (heuristic)
#<freq> BB:117 => BB:118 probability = 0.20000
#<freq> BB:117 => BB:113 probability = 0.80000
#<freq>
	ldl	$19,672($sp)              	# [0]  gra_spill_temp_76
	ldl	$20,640($sp)              	# [1]  gra_spill_temp_72
	addw	$19,3,$19                	# [4]  
	stl	$19,672($sp)              	# [5]  gra_spill_temp_76
#<doc> $19 is overwritten with the boolean (temp_76 <= temp_72); the counter
#<doc> itself was already stored back above.
	cmple	$19,$20,$19             	# [8]  
#<doc> $20 is reused here: the bound is no longer needed once compared.
	ldl	$20,656($sp)              	# [9]  gra_spill_temp_74
	ldl	$21,648($sp)              	# [10]  gra_spill_temp_73
	ldi	$20,3($20)                	# [13]  
	stl	$20,656($sp)              	# [14]  gra_spill_temp_74
	ldi	$21,3($21)                	# [17]  
	stl	$21,648($sp)              	# [18]  gra_spill_temp_73
#<bpre> branch predict taken
	bne	$19,.Lt_1_216             	# [19]  
#Block: 118 Pred: 117 Succ: 119 130 
#<doc> Reached by fall-through when the .Lt_1_216 loop is not re-entered.
#<doc> Computes (gra_spill_temp_76 <= gra_spill_temp_75 - 4) and jumps to
#<doc> .Lt_1_226 when that is false; otherwise falls into .Lt_1_310.
#<doc> NOTE(review): this looks like the "are there leftover rows after the
#<doc> step-3 loop" test -- confirm against the C source around line 205.
.L_BB118_stencil_core:	# 0x1344
#<freq>
#<freq> BB:118 frequency = 0.75000 (heuristic)
#<freq> BB:118 => BB:119 probability = 0.50000
#<freq> BB:118 => BB:130 probability = 0.50000
#<freq>
	ldl	$23,664($sp)              	# [0]  gra_spill_temp_75
	ldl	$22,672($sp)              	# [1]  gra_spill_temp_76
	subw	$23,4,$23                	# [4]  
	cmple	$22,$23,$22             	# [8]  
#<bpre> branch predict unknown
	beq	$22,.Lt_1_226             	# [9]  
#Block: 119 Pred: 118 121 Succ: 120 130 
#<doc> Guard: reloads gra_spill_temp_61 and skips to .Lt_1_226 when it is zero,
#<doc> otherwise falls through into the preheader BB120.
#<doc> NOTE(review): temp_61 is presumably an inner trip count or a
#<doc> "trip count > 0" flag computed earlier -- not visible from here.
.Lt_1_310:	# 0x1358
#<freq>
#<freq> BB:119 frequency = 0.58500 (heuristic)
#<freq> BB:119 => BB:120 probability = 0.94030
#<freq> BB:119 => BB:130 probability = 0.05970
#<freq>
	ldl	$24,552($sp)              	# [0]  gra_spill_temp_61
#<bpre> branch predict not taken
	beq	$24,.Lt_1_226             	# [4]  
#Block: 120 Pred: 119 Succ: 126 
#<doc> Preheader for the loop headed at .Lt_1_230. Values set up here
#<doc> (assuming Alpha-style `op src1,src2,dst` operand order):
#<doc>   $23 = gra_spill_temp_76                 (starting outer index)
#<doc>   $12 = $14 - 2                           (inner trip count used below)
#<doc>   $7  = gra_spill_temp_75 - 3             (outer loop end value)
#<doc>   $8  = gra_spill_temp_75 - temp_76 - 3   (saved to gra_spill_temp_4)
#<doc>   $24 = temp_76 + gra_spill_temp_9
#<doc>   $22 = temp_76 + gra_spill_temp_82
#<doc> $14 is defined outside the visible range.
.L_BB120_stencil_core:	# 0x1360
#<freq>
#<freq> BB:120 frequency = 0.55007 (heuristic)
#<freq>
	ldl	$23,672($sp)              	# [0]  gra_spill_temp_76
	subw	$14,2,$12                	# [0]  
	ldl	$7,664($sp)               	# [1]  gra_spill_temp_75
	ldl	$24,136($sp)              	# [2]  gra_spill_temp_9
	subw	$7,$23,$8                	# [5]  
	ldl	$22,720($sp)              	# [6]  gra_spill_temp_82
	subw	$8,3,$8                  	# [6]  
	stl	$8,96($sp)                	# [7]  gra_spill_temp_4
	subw	$7,3,$7                  	# [7]  
	addl	$23,$24,$24              	# [9]  
	addl	$23,$22,$22              	# [10]  
#Block: 126 Pred: 129 120 Succ: 248 
#<doc> Head of the outer loop. Each pass rebuilds the pointers the inner loop
#<doc> walks, from the three running indices $23, $22 and $24:
#<doc>   $25, $27, $18 : copies of $23, $22, $24 (the latch BB129 steps these)
#<doc>   $20           : inner iteration counter, reset to 0
#<doc>   $17 = temp_65 + 8*$23          $19 = temp_66 + 8*$23
#<doc>   $6  = temp_81 + 8*($23 + temp_80)
#<doc>   $16 = temp_81 + 8*($24 + temp_80)
#<doc>   $8  = temp_81 + 8*($24 + temp_82)
#<doc>   $21 = temp_81 + 8*$22
#<doc> $27 and $25 are also spilled (gra_spill_temp_7 / _8) because the inner
#<doc> loop reuses those register numbers.
#<doc> (Assumes `s8addl a,b,dst` computes 8*a + b and $31 reads as zero, as on
#<doc> Alpha -- confirm against the SW ISA manual.)
.Lt_1_230:	# 0x138c
#<loop> Loop body line 218, nesting depth: 1, estimated iterations: 2
#<freq>
#<freq> BB:126 frequency = 1.10015 (heuristic)
#<freq>
	ldl	$8,720($sp)               	# [0]  gra_spill_temp_82
	mov	$23,$25                   	# [0]  
	ldl	$6,704($sp)               	# [1]  gra_spill_temp_80
	mov	$22,$27                   	# [1]  
	ldl	$17,584($sp)              	# [2]  gra_spill_temp_65
	mov	$31,$20                   	# [2]  
	ldl	$19,592($sp)              	# [3]  gra_spill_temp_66
	mov	$24,$18                   	# [3]  
	ldl	$21,712($sp)              	# [4]  gra_spill_temp_81
	addl	$24,$8,$8                	# [4]  
	addl	$24,$6,$16               	# [5]  
	addl	$23,$6,$6                	# [5]  
	s8addl	$23,$17,$17            	# [6]  
	stl	$27,120($sp)              	# [6]  gra_spill_temp_7
	s8addl	$23,$19,$19            	# [7]  
	stl	$25,128($sp)              	# [7]  gra_spill_temp_8
	s8addl	$6,$21,$6              	# [8]  
	s8addl	$16,$21,$16            	# [8]  
	s8addl	$8,$21,$8              	# [9]  
	s8addl	$22,$21,$21            	# [9]  
#Block: 248 Pred: 126 Succ: 252 251 
#<doc> Preloads the double at 1128($21) and tests the low bit of the inner trip
#<doc> count $12. If the bit is clear (even count) the peeled remainder
#<doc> iteration BB252 is skipped and control goes to BB251.
#<doc> NOTE(review): register numbers are shared between integer and
#<doc> floating-point operands in this listing. The `mov $23,$22` below is
#<doc> presumably an FP copy of the value just loaded (BB250 later consumes $22
#<doc> as an fmad operand) -- confirm how the assembler disambiguates.
.L_BB248_stencil_core:	# 0x13dc
#<loop> Part of loop body line 218, head labeled .Lt_1_230
#<freq>
#<freq> BB:248 frequency = 1.10015 (heuristic)
#<freq> BB:248 => BB:252 probability = 0.50000
#<freq> BB:248 => BB:251 probability = 0.50000
#<freq>
	.loc	1	214	0
	fldd	$23,1128($21)            	# [0]  
	and	$12,1,$24                 	# [0]  
	mov	$23,$22                   	# [4]  
#<bpre> branch predict unknown
	beq	$24,.L_BB251_stencil_core 	# [4]  
#Block: 252 Pred: 248 Succ: 251 
#<doc> Peeled single iteration, executed only when the inner trip count $12 is
#<doc> odd. It performs one update for source line 214 and one for line 218.
#<doc> Both have the same shape (assuming `fmad a,b,c,dst` = a*b + c):
#<doc>   out = centre * $4 + (sum of six loaded values) * $5
#<doc> Line 214: centre = 1128($21) (preloaded into $23 by BB248); terms are
#<doc>   8($21), 2248($21), 168($17) [A_ls], 1288($21), 1120($21), 1136($21);
#<doc>   result stored to 1128($6).
#<doc> Line 218: centre = 968($8); terms are -152($8), 2088($8), 808($8),
#<doc>   168($19) [A_rs], 960($8), 976($8); result stored to 968($16).
#<doc> NOTE(review): $4 / $5 are presumably alpha_d / beta_d -- they are set
#<doc> outside the visible range.
#<doc> On exit the counter $20 is 1 and every pointer has moved one step:
#<doc> $17,$19 by 160 bytes; $21,$6,$8,$16 by 1120 bytes.
.L_BB252_stencil_core:	# 0x13ec
#<loop> Part of loop body line 218, head labeled .Lt_1_230
#<loop> Unrolling remainder loop (at most 1 iteration)
#<freq>
#<freq> BB:252 frequency = 0.55007 (heuristic)
#<freq>
	fldd	$22,2248($21)            	# [0]  id:1542 slave+0x0
	fldd	$1,8($21)                	# [1]  id:1541 slave+0x0
	fldd	$28,168($17)             	# [2]  id:1540 A_ls+0x0
	.loc	1	218	0
	ldi	$17,160($17)              	# [2]  
	.loc	1	214	0
	fldd	$27,1288($21)            	# [3]  id:1539 slave+0x0
	faddd	$1,$22,$1               	# [5]  
	fldd	$25,1120($21)            	# [6]  id:1538 slave+0x0
	faddd	$28,$1,$28              	# [12]  
	fldd	$24,1136($21)            	# [13]  id:1537 slave+0x0
	.loc	1	218	0
	ldi	$21,1120($21)             	# [13]  
	fldd	$20,2088($8)             	# [14]  id:1550 slave+0x0
	.loc	1	214	0
	faddd	$27,$28,$27             	# [19]  
	.loc	1	218	0
	fldd	$3,-152($8)              	# [20]  id:1549 slave+0x0
	.loc	1	214	0
	faddd	$25,$27,$25             	# [26]  
	.loc	1	218	0
	fldd	$1,168($19)              	# [27]  id:1547 A_rs+0x0
	ldi	$19,160($19)              	# [27]  
	fldd	$28,960($8)              	# [28]  id:1546 slave+0x0
	faddd	$3,$20,$3               	# [30]  
	fldd	$27,976($8)              	# [31]  id:1545 slave+0x0
#<doc> Integer $20 = 1: one iteration has now been consumed.
	addw	$31,1,$20                	# [31]  
	.loc	1	214	0
	faddd	$24,$25,$24             	# [33]  
	fmuld	$24,$5,$24              	# [40]  
	fmad	$23,$4,$24,$24           	# [47]  
	fstd	$24,1128($6)             	# [57]  id:1543 slave+0x0
	.loc	1	218	0
	ldi	$6,1120($6)               	# [57]  
#<doc> The two loads below are issued only after the line-214 store above.
#<doc> NOTE(review): presumably the scheduler could not rule out aliasing
#<doc> between the store through $6 and these loads through $8.
	fldd	$2,808($8)               	# [58]  id:1548 slave+0x0
	fldd	$25,968($8)              	# [59]  id:1544 slave+0x0
	ldi	$8,1120($8)               	# [59]  
	faddd	$2,$3,$2                	# [62]  
	faddd	$1,$2,$1                	# [69]  
	faddd	$28,$1,$28              	# [76]  
	faddd	$27,$28,$27             	# [83]  
	fmuld	$27,$5,$27              	# [90]  
	fmad	$25,$4,$27,$25           	# [97]  
	fstd	$25,968($16)             	# [107]  id:1551 slave+0x0
	ldi	$16,1120($16)             	# [107]  
#Block: 251 Pred: 248 252 Succ: 254 253 
#<doc> Computes $12 >> 1, the number of passes for the 2x unrolled loop BB250.
#<doc> When that is zero the unrolled loop is bypassed via .L_BB253.
.L_BB251_stencil_core:	# 0x147c
#<loop> Part of loop body line 218, head labeled .Lt_1_230
#<freq>
#<freq> BB:251 frequency = 1.10015 (heuristic)
#<freq> BB:251 => BB:254 probability = 0.50000
#<freq> BB:251 => BB:253 probability = 0.50000
#<freq>
	sra	$12,1,$23                 	# [0]  
#<bpre> branch predict unknown
	beq	$23,.L_BB253_stencil_core 	# [1]  
#Block: 254 Pred: 251 Succ: 250 
#<doc> Preheader of BB250: saves the pair count to gra_spill_temp_85. The slot
#<doc> is not read back anywhere in BB250, which terminates on $20 == $12.
.L_BB254_stencil_core:	# 0x1484
#<loop> Part of loop body line 218, head labeled .Lt_1_230
#<freq>
#<freq> BB:254 frequency = 0.55007 (heuristic)
#<freq>
	stl	$23,744($sp)              	# [0]  gra_spill_temp_85
#Block: 250 Pred: 250 254 Succ: 250 255 
#<doc> Inner loop, unrolled twice: each pass performs two line-214 updates and
#<doc> two line-218 updates, each of the form
#<doc>   out = centre * $4 + (sum of six loaded values) * $5
#<doc> (assuming `fmad a,b,c,dst` = a*b + c). The second copy of each update
#<doc> addresses the same arrays one row further on (+1120 bytes on the
#<doc> $21/$6/$8/$16 pointers, +160 bytes on the A_ls/A_rs pointers $17/$19).
#<doc> Per pass: counter $20 += 2; $17,$19 += 320; $21,$6,$8,$16 += 2240.
#<doc> The loop repeats until $20 == $12.
#<doc> On entry $22 carries the line-214 centre value preloaded by BB248; it is
#<doc> reloaded for the next pass by the 3368($21) load below.
.L_BB250_stencil_core:	# 0x1488
#<loop> Loop body line 218, nesting depth: 2, estimated iterations: 2
#<loop> unrolled 2 times
#<freq>
#<freq> BB:250 frequency = 1.92526 (heuristic)
#<freq> BB:250 => BB:250 probability = 0.50000
#<freq> BB:250 => BB:255 probability = 0.50000
#<freq>
	.loc	1	214	0
	fldd	$15,2248($21)            	# [0]  id:1542 slave+0x0
	.loc	1	218	0
	addw	$20,2,$20                	# [0]  
	.loc	1	214	0
	fldd	$25,8($21)               	# [1]  id:1541 slave+0x0
	fldd	$24,168($17)             	# [2]  id:1540 A_ls+0x0
	faddd	$25,$15,$25             	# [5]  
	fldd	$23,1288($21)            	# [6]  id:1539 slave+0x0
	faddd	$24,$25,$24             	# [12]  
	fldd	$13,1120($21)            	# [13]  id:1538 slave+0x0
	faddd	$23,$24,$23             	# [19]  
	fldd	$11,1136($21)            	# [20]  id:1537 slave+0x0
	faddd	$13,$23,$13             	# [26]  
	.loc	1	218	0
	fldd	$10,-152($8)             	# [27]  id:1549 slave+0x0
	.loc	1	214	0
	faddd	$11,$13,$11             	# [33]  
	.loc	1	218	0
	fldd	$13,2088($8)             	# [34]  id:1550 slave+0x0
	.loc	1	214	0
	fmuld	$11,$5,$11              	# [40]  
	.loc	1	218	0
	fldd	$3,168($19)              	# [41]  id:1547 A_rs+0x0
	faddd	$10,$13,$10             	# [44]  
	fldd	$2,960($8)               	# [45]  id:1546 slave+0x0
	.loc	1	214	0
	fmad	$22,$4,$11,$11           	# [47]  
	.loc	1	218	0
	fldd	$1,976($8)               	# [48]  id:1545 slave+0x0
	.loc	1	214	0
	fldd	$22,3368($21)            	# [49]  id:1542 slave+0x0
	fldd	$26,328($17)             	# [50]  id:1540 A_ls+0x0
	.loc	1	218	0
	ldi	$17,320($17)              	# [50]  
	.loc	1	214	0
	fldd	$25,2408($21)            	# [51]  id:1539 slave+0x0
	fldd	$24,2240($21)            	# [52]  id:1538 slave+0x0
	fldd	$23,2256($21)            	# [53]  id:1537 slave+0x0
#<doc> First line-214 result.
	fstd	$11,1128($6)             	# [57]  id:1543 slave+0x0
	.loc	1	218	0
	fldd	$9,808($8)               	# [58]  id:1548 slave+0x0
	fldd	$28,968($8)              	# [59]  id:1544 slave+0x0
	faddd	$9,$10,$9               	# [62]  
	fldd	$10,328($19)             	# [63]  id:1547 A_rs+0x0
	ldi	$19,320($19)              	# [63]  
	faddd	$3,$9,$3                	# [69]  
	fldd	$9,2080($8)              	# [69]  id:1546 slave+0x0
	faddd	$2,$3,$2                	# [76]  
	fldd	$3,2096($8)              	# [76]  id:1545 slave+0x0
	faddd	$1,$2,$1                	# [83]  
	fmuld	$1,$5,$1                	# [90]  
	fmad	$28,$4,$1,$28            	# [97]  
#<doc> Exit flag, computed early: integer $1 = ($20 == $12). It shares its
#<doc> register number with the FP $1 consumed by the fmad just above.
	cmpeq	$20,$12,$1              	# [97]  
#<doc> First line-218 result.
	fstd	$28,968($16)             	# [107]  id:1551 slave+0x0
	.loc	1	214	0
	fldd	$27,1128($21)            	# [108]  id:1541 slave+0x0
	.loc	1	218	0
	ldi	$21,2240($21)             	# [108]  
	fldd	$13,968($8)              	# [109]  id:1549 slave+0x0
	.loc	1	214	0
	faddd	$27,$22,$27             	# [112]  
	faddd	$26,$27,$26             	# [119]  
	faddd	$25,$26,$25             	# [126]  
	faddd	$24,$25,$24             	# [133]  
	faddd	$23,$24,$23             	# [140]  
	fmuld	$23,$5,$23              	# [147]  
#<doc> $15 (loaded from 2248($21) at the top of the pass) doubles as the
#<doc> centre value of the second line-214 update.
	fmad	$15,$4,$23,$15           	# [154]  
	.loc	1	218	0
	fldd	$23,3208($8)             	# [154]  id:1550 slave+0x0
	faddd	$13,$23,$13             	# [158]  
	.loc	1	214	0
#<doc> Second line-214 result.
	fstd	$15,2248($6)             	# [164]  id:1543 slave+0x0
	.loc	1	218	0
	fldd	$11,1928($8)             	# [165]  id:1548 slave+0x0
	ldi	$6,2240($6)               	# [165]  
	fldd	$2,2088($8)              	# [166]  id:1544 slave+0x0
	ldi	$8,2240($8)               	# [166]  
	faddd	$11,$13,$11             	# [169]  
	faddd	$10,$11,$10             	# [176]  
	faddd	$9,$10,$9               	# [183]  
	faddd	$3,$9,$3                	# [190]  
	fmuld	$3,$5,$3                	# [197]  
	fmad	$2,$4,$3,$2              	# [204]  
#<doc> Second line-218 result.
	fstd	$2,2088($16)             	# [214]  id:1551 slave+0x0
	ldi	$16,2240($16)             	# [214]  
#<bpre> branch predict unknown
	beq	$1,.L_BB250_stencil_core  	# [215]  
#Block: 255 Pred: 250 Succ: 253 
#<doc> BB255 holds no instructions; it is the fall-through exit of BB250.
.L_BB255_stencil_core:	# 0x1594
#<loop> Part of loop body line 218, head labeled .Lt_1_230
#<freq>
#<freq> BB:255 frequency = 0.96263 (heuristic)
#<freq>
#Block: 253 Pred: 251 255 Succ: 249 
#<doc> Restores the two outer indices that BB126 spilled before the inner loop
#<doc> reused their registers: $8 <- gra_spill_temp_8 (the copy of $23),
#<doc> $6 <- gra_spill_temp_7 (the copy of $22).
.L_BB253_stencil_core:	# 0x1594
#<loop> Part of loop body line 218, head labeled .Lt_1_230
#<freq>
#<freq> BB:253 frequency = 0.00000 (heuristic)
#<freq>
	ldl	$8,128($sp)               	# [0]  gra_spill_temp_8
	ldl	$6,120($sp)               	# [1]  gra_spill_temp_7
#Block: 249 Pred: 253 Succ: 129 
.L_BB249_stencil_core:	# 0x159c
#<loop> Part of loop body line 218, head labeled .Lt_1_230
#<freq>
#<freq> BB:249 frequency = 1.10015 (heuristic)
#<freq>
#Block: 129 Pred: 249 Succ: 130 126 
#<doc> Latch of the outer loop headed at .Lt_1_230. Steps the three running
#<doc> indices by one ($23 = $8 + 1, $24 = $18 + 1, $22 = $6 + 1) and loops
#<doc> back until $23 equals the end value held in $7.
.L_BB129_stencil_core:	# 0x159c
#<loop> Part of loop body line 218, head labeled .Lt_1_230
#<freq>
#<freq> BB:129 frequency = 1.10015 (heuristic)
#<freq> BB:129 => BB:130 probability = 0.50000
#<freq> BB:129 => BB:126 probability = 0.50000
#<freq>
	addw	$8,1,$23                 	# [0]  
	ldi	$24,1($18)                	# [0]  
	cmpeq	$23,$7,$27              	# [1]  
	ldi	$22,1($6)                 	# [1]  
#<bpre> branch predict unknown
	beq	$27,.Lt_1_230             	# [2]  
#Block: 130 Pred: 119 129 118 316 Succ: 131 141 
#<doc> Join point after the line-214/218 loops. Reloads gra_spill_temp_40 and
#<doc> branches to .Lt_1_237 when it is zero; otherwise falls into BB131.
#<doc> NOTE(review): temp_40 is presumably the "next loop nest has work" flag;
#<doc> its definition is outside the visible range.
.Lt_1_226:	# 0x15b0
.Lt_1_224:	# 0x15b0
#<freq>
#<freq> BB:130 frequency = 1.00000 (heuristic)
#<freq> BB:130 => BB:131 probability = 0.94030
#<freq> BB:130 => BB:141 probability = 0.05970
#<freq>
	ldl	$28,384($sp)              	# [0]  gra_spill_temp_40
#<bpre> branch predict not taken
	beq	$28,.Lt_1_237             	# [4]  
#Block: 131 Pred: 130 Succ: 133 
#<doc> Preheader for the loop headed at .Lt_1_240. With n = gra_spill_temp_75
#<doc> (assuming Alpha-style `op src1,src2,dst` order and $31 == 0):
#<doc>   gra_spill_temp_79 = 0          (outer counter, stepped by 3 in BB137)
#<doc>   gra_spill_temp_78 = 0          (offset, stepped by 24 in BB137)
#<doc>   gra_spill_temp_77 = gra_spill_temp_82
#<doc>   gra_spill_temp_72 = n - 6      (bound compared in BB137)
#<doc>   $6                = gra_spill_temp_63 - 2   (inner trip count)
#<doc>   gra_spill_temp_16 = a value derived from (n - 3), see below
#<doc> NOTE(review): the ldi/ldih pair builds -1431655765, whose low 32 bits
#<doc> are 0xAAAAAAAB. Together with the absolute value, `umulw`, the shift
#<doc> right by 33 and the sign restore, this looks like the usual
#<doc> multiply-by-reciprocal expansion of a signed (n - 3) / 3 -- confirm
#<doc> `umulw`/`selge` semantics against the SW ISA manual.
.L_BB131_stencil_core:	# 0x15b8
#<freq>
#<freq> BB:131 frequency = 0.94030 (heuristic)
#<freq>
	ldl	$3,664($sp)               	# [0]  gra_spill_temp_75
	ldi	$6,-21845($31)            	# [0]  
	ldih	$6,-21845($6)            	# [1]  
	ldl	$7,720($sp)               	# [1]  gra_spill_temp_82
	stl	$31,696($sp)              	# [2]  gra_spill_temp_79
	subw	$3,3,$1                  	# [4]  
#<doc> $2 = -(n - 3); the selge below then picks whichever of $1 / $2 is
#<doc> non-negative (presumably |n - 3|).
	subw	$31,$1,$2                	# [5]  
	subw	$3,6,$3                  	# [5]  
	selge	$1,$1,$2,$2             	# [6]  
	stl	$3,640($sp)               	# [6]  gra_spill_temp_72
	umulw	$2,$6,$2                	# [7]  
#<doc> $6 is reused: the reciprocal constant is dead after the multiply.
	ldl	$6,568($sp)               	# [7]  gra_spill_temp_63
	stl	$7,680($sp)               	# [8]  gra_spill_temp_77
	subw	$6,2,$6                  	# [11]  
	srl	$2,33,$2                  	# [12]  
	stl	$31,688($sp)              	# [12]  gra_spill_temp_78
#<doc> Re-apply the sign of (n - 3) to the quotient.
	subw	$31,$2,$3                	# [13]  
	selge	$1,$2,$3,$1             	# [14]  
	stl	$1,192($sp)               	# [15]  gra_spill_temp_16
#Block: 133 Pred: 137 131 Succ: 134 137 
#<doc> Head of the outer loop. Reloads gra_spill_temp_71 and, when it is zero,
#<doc> skips the inner loop entirely by jumping to the latch at .Lt_1_241.
#<doc> NOTE(review): temp_71 is presumably the inner-loop "has iterations"
#<doc> flag; it is loop-invariant as far as the visible code shows.
.Lt_1_240:	# 0x1604
#<loop> Loop body line 218, nesting depth: 1, estimated iterations: 5
#<freq>
#<freq> BB:133 frequency = 4.70149 (heuristic)
#<freq> BB:133 => BB:134 probability = 0.92799
#<freq> BB:133 => BB:137 probability = 0.07201
#<freq>
	ldl	$7,632($sp)               	# [0]  gra_spill_temp_71
#<bpre> branch predict not taken
	beq	$7,.Lt_1_241              	# [4]  
#Block: 134 Pred: 133 Succ: 256 
#<doc> Builds the pointers walked by the inner loop .Lt_1_245. With
#<doc> i = gra_spill_temp_79, base = gra_spill_temp_81 and
#<doc> off = gra_spill_temp_78 (assuming `s8addl a,b,dst` = 8*a + b):
#<doc>   $28 = base + 8*(i + temp_62 + temp_80)   (store pointer, line 231)
#<doc>   $8  = base + 8*(i + temp_62 + temp_82)   (load pointer,  line 231)
#<doc>   $21 = base + 8*(i + temp_80)             (store pointer, line 227)
#<doc>   $7  = base + 8*temp_77                   (load pointer,  line 227)
#<doc>   $16 = temp_67 + off                      (A_us pointer)
#<doc>   $19 = temp_68 + off                      (A_ds pointer)
#<doc>   $17 = 0                                  (inner iteration counter)
#<doc> The array names come from the compiler's operand annotations in the
#<doc> loop body; off is a byte offset (it is added unscaled).
.L_BB134_stencil_core:	# 0x160c
#<loop> Part of loop body line 218, head labeled .Lt_1_240
#<freq>
#<freq> BB:134 frequency = 4.36292 (heuristic)
#<freq>
	ldl	$21,696($sp)              	# [0]  gra_spill_temp_79
	ldl	$28,560($sp)              	# [1]  gra_spill_temp_62
	ldl	$8,720($sp)               	# [2]  gra_spill_temp_82
	addl	$21,$28,$28              	# [5]  
	ldl	$1,704($sp)               	# [6]  gra_spill_temp_80
	addl	$28,$8,$8                	# [9]  
	ldl	$7,680($sp)               	# [10]  gra_spill_temp_77
	addl	$21,$1,$21               	# [13]  
	ldl	$16,712($sp)              	# [14]  gra_spill_temp_81
	addl	$28,$1,$28               	# [14]  
	ldl	$17,600($sp)              	# [15]  gra_spill_temp_67
	s8addl	$28,$16,$28            	# [18]  
	s8addl	$8,$16,$8              	# [19]  
	s8addl	$21,$16,$21            	# [19]  
	s8addl	$7,$16,$7              	# [20]  
#<doc> $16 is reused from here on: base is dead, it now holds off.
	ldl	$16,688($sp)              	# [20]  gra_spill_temp_78
	ldl	$19,608($sp)              	# [21]  gra_spill_temp_68
	addl	$16,$19,$19              	# [25]  
	addl	$16,$17,$16              	# [25]  
	mov	$31,$17                   	# [26]  
#Block: 256 Pred: 134 Succ: 136 
#<doc> Prologue for the inner loop .Lt_1_245: preloads the nine doubles that
#<doc> the loop body expects to find in registers on entry ($20,$27,$25,$24
#<doc> from the line-231 pointer $8; $23,$22,$9,$10,$11 from the line-227
#<doc> pointer $7). The loop body reloads each of them for its next pass.
.L_BB256_stencil_core:	# 0x165c
#<loop> Part of loop body line 218, head labeled .Lt_1_240
#<freq>
#<freq> BB:256 frequency = 4.36292 (heuristic)
#<freq>
	.loc	1	231	0
# 227        slave[lhs_no][0][j][k] = alpha_d * slave[rhs_no][0][j][k]+ \
# 228                       beta_d * (A_us[j][k] + slave[rhs_no][1][j][k] +\
# 229                       slave[rhs_no][0][j-1][k] + slave[rhs_no][0][j+1][k]+\
# 230                       slave[rhs_no][0][j][k-1] + slave[rhs_no][0][j][k+1]);
# 231        slave[lhs_no][i_region][j][k] =  alpha_d * slave[rhs_no][i_region][j][k] + \
	fldd	$20,-1104($8)            	# [0]  
	fldd	$27,-936($8)             	# [1]  
	.loc	1	227	0
	fldd	$23,16($7)               	# [2]  
	fldd	$22,184($7)              	# [3]  
	.loc	1	231	0
	fldd	$25,-1112($8)            	# [4]  
	fldd	$24,-944($8)             	# [5]  
	.loc	1	227	0
	fldd	$9,168($7)               	# [6]  
	fldd	$10,8($7)                	# [7]  
	fldd	$11,176($7)              	# [8]  
#Block: 136 Pred: 136 256 Succ: 257 136 
#<doc> Inner loop for source lines 227 and 231. Each pass issues six stores:
#<doc>   line 227 -> 168($21), 176($21), 184($21)
#<doc>   line 231 -> -952($28), -944($28), -936($28)
#<doc> i.e. three consecutive doubles per statement. Every result has the form
#<doc>   out = centre * $4 + (sum of six loaded values) * $5
#<doc> (assuming `fmad a,b,c,dst` = a*b + c), matching the C statement quoted
#<doc> for line 227 if $4 = alpha_d and $5 = beta_d (set outside this range --
#<doc> TODO confirm).
#<doc> Values shared between neighbouring columns are kept in registers
#<doc> instead of being reloaded; the preloads in BB256 and the `mov` copies
#<doc> below exist for that purpose.
#<doc> Per pass: counter $17 += 1 and all six pointers ($16, $19, $7, $21, $8,
#<doc> $28) advance by 160 bytes. The loop repeats until $17 == $6.
	.align	4
.Lt_1_245:	# 0x1680
#<loop> Loop body line 218, nesting depth: 2, estimated iterations: 5
#<freq>
#<freq> BB:136 frequency = 21.81461 (heuristic)
#<freq> BB:136 => BB:257 probability = 0.20000
#<freq> BB:136 => BB:136 probability = 0.80000
#<freq>
	fldd	$13,1288($7)             	# [0]  id:1558 slave+0x0
#<doc> Keep the current centre value ($9, from 168($7)) in $2 before $9 is
#<doc> overwritten by the 328($7) load two instructions later.
#<doc> NOTE(review): presumably an FP register copy -- the listing uses the
#<doc> same `mov` spelling for integer and FP moves.
	mov	$9,$2                     	# [0]  
	fldd	$12,168($16)             	# [1]  id:1557 A_us+0x0
	.loc	1	231	0
	addw	$17,1,$17                	# [1]  
	.loc	1	227	0
	fldd	$9,328($7)               	# [2]  id:1555 slave+0x0
	faddd	$12,$13,$12             	# [5]  
	fldd	$3,160($7)               	# [6]  id:1554 slave+0x0
	faddd	$10,$12,$10             	# [12]  
	.loc	1	231	0
	fldd	$1,168($19)              	# [13]  id:1566 A_ds+0x0
	.loc	1	227	0
	faddd	$9,$10,$10              	# [19]  
	.loc	1	231	0
	fldd	$18,-792($8)             	# [20]  id:1563 slave+0x0
	.loc	1	227	0
	faddd	$3,$10,$3               	# [26]  
	.loc	1	231	0
	fldd	$15,-960($8)             	# [27]  id:1562 slave+0x0
	.loc	1	227	0
	faddd	$11,$3,$3               	# [33]  
	fldd	$12,176($16)             	# [34]  id:1573 A_us+0x0
	fmuld	$3,$5,$3                	# [40]  
	fldd	$13,1296($7)             	# [41]  id:1574 slave+0x0
	fmad	$2,$4,$3,$2              	# [47]  
#<doc> $11 (176($7)) becomes the centre of the second line-227 result; it is
#<doc> copied to $3 before $11 is reloaded from 336($7).
	mov	$11,$3                    	# [48]  
	fldd	$11,336($7)              	# [48]  id:1571 slave+0x0
	faddd	$12,$13,$12             	# [51]  
#<doc> Line 227, first column.
	fstd	$2,168($21)              	# [57]  id:1559 slave+0x0
	.loc	1	231	0
	fldd	$26,-2072($8)            	# [58]  id:1565 slave+0x0
	.loc	1	227	0
	faddd	$23,$12,$12             	# [64]  
	.loc	1	231	0
	fldd	$13,-952($8)             	# [65]  id:1560 slave+0x0
	faddd	$26,$1,$26              	# [68]  
	fldd	$2,176($19)              	# [69]  id:1582 A_ds+0x0
	.loc	1	227	0
	faddd	$11,$12,$12             	# [71]  
	.loc	1	231	0
	faddd	$25,$26,$25             	# [75]  
	.loc	1	227	0
	fldd	$26,184($16)             	# [75]  id:1589 A_us+0x0
	.loc	1	231	0
	ldi	$16,160($16)              	# [76]  
	faddd	$18,$25,$18             	# [82]  
	faddd	$15,$18,$15             	# [89]  
	.loc	1	227	0
	fldd	$18,192($7)              	# [89]  id:1585 slave+0x0
	.loc	1	231	0
	faddd	$24,$15,$15             	# [96]  
	fldd	$24,-784($8)             	# [96]  id:1579 slave+0x0
	fmuld	$15,$5,$15              	# [103]  
	fmad	$13,$4,$15,$13           	# [110]  
#<doc> $22 (184($7)) becomes the centre of the third line-227 result; it is
#<doc> copied to $15 before $22 is reloaded from 344($7).
	mov	$22,$15                   	# [110]  
#<doc> Line 231, first column.
	fstd	$13,-952($28)            	# [120]  id:1567 slave+0x0
	.loc	1	227	0
	fldd	$10,168($7)              	# [121]  id:1570 slave+0x0
	.loc	1	231	0
	fldd	$25,-952($8)             	# [122]  id:1578 slave+0x0
	.loc	1	227	0
	faddd	$10,$12,$12             	# [125]  
	.loc	1	231	0
	fldd	$13,184($19)             	# [126]  id:1598 A_ds+0x0
	ldi	$19,160($19)              	# [126]  
	.loc	1	227	0
	faddd	$22,$12,$12             	# [132]  
	fldd	$22,344($7)              	# [132]  id:1587 slave+0x0
	fmuld	$12,$5,$12              	# [139]  
	fmad	$3,$4,$12,$3             	# [146]  
#<doc> Line 227, second column.
	fstd	$3,176($21)              	# [156]  id:1575 slave+0x0
	.loc	1	231	0
	fldd	$1,-2064($8)             	# [157]  id:1581 slave+0x0
	fldd	$23,-944($8)             	# [158]  id:1576 slave+0x0
	faddd	$1,$2,$1                	# [161]  
	fldd	$3,-1096($8)             	# [162]  id:1596 slave+0x0
	faddd	$20,$1,$1               	# [168]  
	.loc	1	227	0
	fldd	$20,24($7)               	# [169]  id:1588 slave+0x0
	.loc	1	231	0
	faddd	$24,$1,$1               	# [175]  
	fldd	$2,-928($8)              	# [176]  id:1593 slave+0x0
	faddd	$25,$1,$1               	# [182]  
	faddd	$27,$1,$27              	# [189]  
	.loc	1	227	0
	fldd	$1,1304($7)              	# [189]  id:1590 slave+0x0
	faddd	$26,$1,$26              	# [193]  
	.loc	1	231	0
	fmuld	$27,$5,$27              	# [196]  
	.loc	1	227	0
	faddd	$20,$26,$20             	# [200]  
	.loc	1	231	0
#<doc> Exit flag, computed early: integer $26 = ($17 == $6). It shares its
#<doc> register number with the FP $26 consumed by the faddd just above.
	cmpeq	$17,$6,$26              	# [200]  
	fmad	$23,$4,$27,$23           	# [203]  
	fldd	$27,-776($8)             	# [203]  id:1595 slave+0x0
	.loc	1	227	0
	faddd	$22,$20,$20             	# [207]  
	.loc	1	231	0
#<doc> Line 231, second column.
	fstd	$23,-944($28)            	# [213]  id:1583 slave+0x0
	.loc	1	227	0
	fldd	$23,176($7)              	# [214]  id:1586 slave+0x0
	.loc	1	231	0
	ldi	$7,160($7)                	# [214]  
	.loc	1	227	0
	faddd	$23,$20,$20             	# [218]  
	faddd	$18,$20,$18             	# [225]  
	.loc	1	231	0
	fldd	$20,-944($8)             	# [225]  id:1594 slave+0x0
	.loc	1	227	0
	fmuld	$18,$5,$18              	# [232]  
	fmad	$15,$4,$18,$15           	# [239]  
#<doc> Line 227, third column.
	fstd	$15,184($21)             	# [249]  id:1591 slave+0x0
	.loc	1	231	0
	ldi	$21,160($21)              	# [249]  
	fldd	$12,-2056($8)            	# [250]  id:1597 slave+0x0
	fldd	$1,-936($8)              	# [251]  id:1592 slave+0x0
	ldi	$8,160($8)                	# [251]  
	faddd	$12,$13,$12             	# [254]  
	faddd	$3,$12,$3               	# [261]  
	faddd	$27,$3,$3               	# [268]  
	faddd	$20,$3,$3               	# [275]  
	faddd	$2,$3,$2                	# [282]  
	fmuld	$2,$5,$2                	# [289]  
	fmad	$1,$4,$2,$1              	# [296]  
#<doc> Line 231, third column.
	fstd	$1,-936($28)             	# [306]  id:1599 slave+0x0
	ldi	$28,160($28)              	# [306]  
#<bpre> branch predict taken
	beq	$26,.Lt_1_245             	# [307]  
#Block: 257 Pred: 136 Succ: 137 
#<doc> BB257 holds no instructions; it is the fall-through exit of .Lt_1_245.
.L_BB257_stencil_core:	# 0x17ec
#<loop> Part of loop body line 218, head labeled .Lt_1_240
#<freq>
#<freq> BB:257 frequency = 4.36292 (heuristic)
#<freq>
#Block: 137 Pred: 257 133 Succ: 138 133 
#<doc> Latch of the outer loop headed at .Lt_1_240. The induction values live
#<doc> in spill slots and are updated in memory:
#<doc>   gra_spill_temp_79 (696($sp)) += 3    -- the compared counter
#<doc>   gra_spill_temp_78 (688($sp)) += 24   -- byte offset; 24 = 3 doubles
#<doc>   gra_spill_temp_77 (680($sp)) += 3
#<doc> The loop is re-entered while the updated temp_79 <= gra_spill_temp_72.
#<doc> (Reading assumes Alpha-style operand order `op src1,src2,dst`.)
.Lt_1_241:	# 0x17ec
#<loop> Part of loop body line 218, head labeled .Lt_1_240
#<freq>
#<freq> BB:137 frequency = 4.70149 (heuristic)
#<freq> BB:137 => BB:138 probability = 0.20000
#<freq> BB:137 => BB:133 probability = 0.80000
#<freq>
	ldl	$16,696($sp)              	# [0]  gra_spill_temp_79
	ldl	$17,640($sp)              	# [1]  gra_spill_temp_72
	addw	$16,3,$16                	# [4]  
	stl	$16,696($sp)              	# [5]  gra_spill_temp_79
#<doc> $16 now holds the boolean (temp_79 <= temp_72), not the counter.
	cmple	$16,$17,$16             	# [8]  
	ldl	$17,688($sp)              	# [9]  gra_spill_temp_78
	ldl	$18,680($sp)              	# [10]  gra_spill_temp_77
	ldi	$17,24($17)               	# [13]  
	stl	$17,688($sp)              	# [14]  gra_spill_temp_78
	ldi	$18,3($18)                	# [17]  
	stl	$18,680($sp)              	# [18]  gra_spill_temp_77
#<bpre> branch predict taken
	bne	$16,.Lt_1_240             	# [19]  
#Block: 138 Pred: 137 Succ: 139 143 
#<doc> Reached by fall-through when the .Lt_1_240 loop is not re-entered.
#<doc> Computes (gra_spill_temp_79 <= gra_spill_temp_75 - 4) and jumps to
#<doc> .Lt_1_331 when that is false; otherwise falls into .Lt_1_311.
#<doc> NOTE(review): presumably the "leftover columns after the step-3 loop"
#<doc> test -- confirm against the C source.
.L_BB138_stencil_core:	# 0x181c
#<freq>
#<freq> BB:138 frequency = 0.94030 (heuristic)
#<freq> BB:138 => BB:139 probability = 0.55000
#<freq> BB:138 => BB:143 probability = 0.45000
#<freq>
	ldl	$20,664($sp)              	# [0]  gra_spill_temp_75
	ldl	$19,696($sp)              	# [1]  gra_spill_temp_79
	subw	$20,4,$20                	# [4]  
	cmple	$19,$20,$19             	# [8]  
#<bpre> branch predict not taken
	beq	$19,.Lt_1_331             	# [9]  
#Block: 139 Pred: 138 141 Succ: 140 151 
#<doc> Guard: reloads gra_spill_temp_71 (the same slot tested at .Lt_1_240) and
#<doc> jumps to .Lt_1_250 when it is zero, bypassing the remainder loop nest
#<doc> that starts in BB140.
.Lt_1_311:	# 0x1830
#<freq>
#<freq> BB:139 frequency = 0.56882 (heuristic)
#<freq> BB:139 => BB:140 probability = 0.94030
#<freq> BB:139 => BB:151 probability = 0.05970
#<freq>
	ldl	$21,632($sp)              	# [0]  gra_spill_temp_71
#<bpre> branch predict not taken
	beq	$21,.Lt_1_250             	# [4]  
#Block: 140 Pred: 139 Succ: 147 
#<doc> Preheader for the loop headed at .Lt_1_254. With i = gra_spill_temp_79
#<doc> and n = gra_spill_temp_75 (assuming `s8addl a,b,dst` = 8*a + b and
#<doc> $31 == 0):
#<doc>   $25 = i                   (starting outer index)
#<doc>   $22 = 8 * i               (byte offset matching i)
#<doc>   $7  = n - 3               (outer loop end value)
#<doc>   $8  = n - i - 3           (saved to gra_spill_temp_3)
#<doc>   $6  = gra_spill_temp_63 - 2   (inner trip count)
#<doc>   $24 = i + gra_spill_temp_82
#<doc> NOTE(review): the .loc for line 289 and the quoted C lines below are the
#<doc> compiler's attribution for this block; the loop it feeds executes code
#<doc> tagged with lines 227/231.
.L_BB140_stencil_core:	# 0x1838
#<freq>
#<freq> BB:140 frequency = 0.53486 (heuristic)
#<freq>
	.loc	1	289	0
# 285                       A_rs[i_region][0]+ \
# 286                       A_fs[i_region][j_region] + \
# 287                       slave[rhs_no][i_region][j_region][1]); 
# 288    //9.8  compute down_right_back_point
# 289    slave[lhs_no][i_region][j_region][k_region] = alpha_d * \
	ldl	$25,696($sp)              	# [0]  gra_spill_temp_79
	ldl	$7,664($sp)               	# [1]  gra_spill_temp_75
	s8addl	$25,$31,$22            	# [4]  
	ldl	$6,568($sp)               	# [5]  gra_spill_temp_63
	subw	$7,$25,$8                	# [8]  
	ldl	$24,720($sp)              	# [9]  gra_spill_temp_82
	subw	$8,3,$8                  	# [9]  
	stl	$8,88($sp)                	# [10]  gra_spill_temp_3
	subw	$7,3,$7                  	# [10]  
	subw	$6,2,$6                  	# [12]  
	addl	$25,$24,$24              	# [13]  
#Block: 147 Pred: 150 140 Succ: 258 
#<doc> Head of the outer remainder loop. Each pass rebuilds the pointers the
#<doc> inner loop walks, from the running values $25 (index), $24 and $22
#<doc> (byte offset). With base = gra_spill_temp_81 (assuming
#<doc> `s8addl a,b,dst` = 8*a + b and $31 == 0):
#<doc>   $13, $26, $15 : copies of $25, $24, $22 (the latch BB150 steps these)
#<doc>   $21           : inner iteration counter, reset to 0
#<doc>   $17 = base + 8*($25 + temp_80)               (store pointer, line 227)
#<doc>   $20 = base + 8*($25 + temp_62 + temp_80)     (store pointer, line 231)
#<doc>   $19 = base + 8*($25 + temp_62 + temp_82)     (load pointer,  line 231)
#<doc>   $23 = base + 8*$24                           (load pointer,  line 227)
#<doc>   $8  = temp_67 + $22                          (A_us pointer)
#<doc>   $16 = temp_68 + $22                          (A_ds pointer)
#<doc> The array names come from the compiler's operand annotations in the
#<doc> inner loop blocks.
.Lt_1_254:	# 0x1864
#<loop> Loop body line 289, nesting depth: 1, estimated iterations: 2
#<freq>
#<freq> BB:147 frequency = 1.06971 (heuristic)
#<freq>
	ldl	$20,560($sp)              	# [0]  gra_spill_temp_62
	mov	$25,$13                   	# [0]  
	ldl	$19,720($sp)              	# [1]  gra_spill_temp_82
	mov	$24,$26                   	# [1]  
	ldl	$21,704($sp)              	# [2]  gra_spill_temp_80
	mov	$22,$15                   	# [2]  
	ldl	$8,600($sp)               	# [3]  gra_spill_temp_67
	addl	$25,$20,$20              	# [4]  
	ldl	$16,608($sp)              	# [5]  gra_spill_temp_68
	addl	$20,$19,$19              	# [5]  
	ldl	$23,712($sp)              	# [6]  gra_spill_temp_81
	addl	$20,$21,$20              	# [6]  
	addl	$25,$21,$17              	# [7]  
#<doc> $21 (temp_80) is dead after the two adds above; reuse it as the counter.
	mov	$31,$21                   	# [7]  
	addl	$22,$8,$8                	# [8]  
	addl	$22,$16,$16              	# [9]  
	s8addl	$17,$23,$17            	# [10]  
	s8addl	$20,$23,$20            	# [10]  
	s8addl	$19,$23,$19            	# [11]  
	s8addl	$24,$23,$23            	# [11]  
#Block: 258 Pred: 147 Succ: 262 261 
#<doc> Preloads the double at 168($23) and tests the low bit of the inner trip
#<doc> count $6. If the bit is clear (even count) the peeled remainder
#<doc> iteration BB262 is skipped and control goes to BB261.
#<doc> NOTE(review): `mov $24,$22` is presumably an FP copy of the value just
#<doc> loaded (BB260 consumes $22 as the first centre value) -- the listing
#<doc> uses one register numbering for both integer and FP operands.
.L_BB258_stencil_core:	# 0x18b4
#<loop> Part of loop body line 289, head labeled .Lt_1_254
#<freq>
#<freq> BB:258 frequency = 1.06971 (heuristic)
#<freq> BB:258 => BB:262 probability = 0.50000
#<freq> BB:258 => BB:261 probability = 0.50000
#<freq>
	.loc	1	227	0
	fldd	$24,168($23)             	# [0]  
	and	$6,1,$25                  	# [0]  
	mov	$24,$22                   	# [4]  
#<bpre> branch predict unknown
	beq	$25,.L_BB261_stencil_core 	# [4]  
#Block: 262 Pred: 258 Succ: 261 
#<doc> Peeled single iteration, executed only when the inner trip count $6 is
#<doc> odd. It performs one line-227 update and one line-231 update, each of
#<doc> the form (assuming `fmad a,b,c,dst` = a*b + c):
#<doc>   out = centre * $4 + (sum of six loaded values) * $5
#<doc> Line 227: centre = 168($23) (preloaded into $24 by BB258); terms are
#<doc>   1288($23), 168($8) [A_us], 8($23), 328($23), 160($23), 176($23);
#<doc>   result stored to 168($17).
#<doc> Line 231: centre = -952($19); terms are -2072($19), 168($16) [A_ds],
#<doc>   -1112($19), -792($19), -960($19), -944($19); result stored to
#<doc>   -952($20).
#<doc> On exit the counter $21 is 1 and all six pointers ($8, $23, $16, $17,
#<doc> $19, $20) have advanced by 160 bytes.
.L_BB262_stencil_core:	# 0x18c4
#<loop> Part of loop body line 289, head labeled .Lt_1_254
#<loop> Unrolling remainder loop (at most 1 iteration)
#<freq>
#<freq> BB:262 frequency = 0.53486 (heuristic)
#<freq>
	fldd	$2,1288($23)             	# [0]  id:1670 slave+0x0
	fldd	$1,168($8)               	# [1]  id:1669 A_us+0x0
	.loc	1	231	0
	ldi	$8,160($8)                	# [1]  
	.loc	1	227	0
	fldd	$28,8($23)               	# [2]  id:1668 slave+0x0
	faddd	$1,$2,$1                	# [5]  
	fldd	$22,328($23)             	# [6]  id:1667 slave+0x0
	faddd	$28,$1,$28              	# [12]  
	fldd	$27,160($23)             	# [13]  id:1666 slave+0x0
	faddd	$22,$28,$28             	# [19]  
	fldd	$25,176($23)             	# [20]  id:1665 slave+0x0
	.loc	1	231	0
	ldi	$23,160($23)              	# [20]  
	fldd	$21,168($16)             	# [21]  id:1678 A_ds+0x0
	ldi	$16,160($16)              	# [21]  
	fldd	$3,-1112($19)            	# [22]  id:1676 slave+0x0
	.loc	1	227	0
	faddd	$27,$28,$27             	# [26]  
	.loc	1	231	0
	fldd	$2,-792($19)             	# [27]  id:1675 slave+0x0
	.loc	1	227	0
	faddd	$25,$27,$25             	# [33]  
	.loc	1	231	0
	fldd	$1,-960($19)             	# [34]  id:1674 slave+0x0
	.loc	1	227	0
	fmuld	$25,$5,$25              	# [40]  
	.loc	1	231	0
	fldd	$28,-944($19)            	# [41]  id:1673 slave+0x0
	.loc	1	227	0
	fmad	$24,$4,$25,$25           	# [47]  
	fstd	$25,168($17)             	# [57]  id:1671 slave+0x0
	.loc	1	231	0
	ldi	$17,160($17)              	# [57]  
#<doc> These two loads are issued only after the line-227 store above.
	fldd	$18,-2072($19)           	# [58]  id:1677 slave+0x0
	fldd	$27,-952($19)            	# [59]  id:1672 slave+0x0
	ldi	$19,160($19)              	# [59]  
	faddd	$18,$21,$18             	# [62]  
#<doc> Integer $21 = 1: one iteration consumed. (FP $21 was read by the faddd
#<doc> just above; the two share a register number only.)
	addw	$31,1,$21                	# [62]  
	faddd	$3,$18,$3               	# [69]  
	faddd	$2,$3,$2                	# [76]  
	faddd	$1,$2,$1                	# [83]  
	faddd	$28,$1,$28              	# [90]  
	fmuld	$28,$5,$28              	# [97]  
	fmad	$27,$4,$28,$27           	# [104]  
	fstd	$27,-952($20)            	# [114]  id:1679 slave+0x0
	ldi	$20,160($20)              	# [114]  
#Block: 261 Pred: 258 262 Succ: 264 263 
#<doc> Computes $6 >> 1, the number of passes for the 2x unrolled loop BB260.
#<doc> When that is zero the unrolled loop is bypassed via .L_BB263.
.L_BB261_stencil_core:	# 0x1954
#<loop> Part of loop body line 289, head labeled .Lt_1_254
#<freq>
#<freq> BB:261 frequency = 1.06971 (heuristic)
#<freq> BB:261 => BB:264 probability = 0.50000
#<freq> BB:261 => BB:263 probability = 0.50000
#<freq>
	sra	$6,1,$18                  	# [0]  
#<bpre> branch predict unknown
	beq	$18,.L_BB263_stencil_core 	# [1]  
#Block: 264 Pred: 261 Succ: 260 
#<doc> BB264 holds no instructions; it falls through into the unrolled loop.
.L_BB264_stencil_core:	# 0x195c
#<loop> Part of loop body line 289, head labeled .Lt_1_254
#<freq>
#<freq> BB:264 frequency = 0.53486 (heuristic)
#<freq>
#Block: 260 Pred: 260 264 Succ: 260 265 
#<doc> Inner remainder loop, unrolled twice: each pass performs two line-227
#<doc> updates and two line-231 updates, each of the form
#<doc>   out = centre * $4 + (sum of six loaded values) * $5
#<doc> (assuming `fmad a,b,c,dst` = a*b + c). The second copy of each update
#<doc> uses the same addressing shifted by +160 bytes.
#<doc> Per pass: counter $21 += 2 and all six pointers ($8, $16, $23, $17,
#<doc> $19, $20) advance by 320 bytes. The loop repeats until $21 == $6.
#<doc> On entry $22 carries the first line-227 centre value preloaded by BB258;
#<doc> it is reloaded for the next pass by the 488($23) load below.
.L_BB260_stencil_core:	# 0x195c
#<loop> Loop body line 289, nesting depth: 2, estimated iterations: 2
#<loop> unrolled 2 times
#<freq>
#<freq> BB:260 frequency = 1.87200 (heuristic)
#<freq> BB:260 => BB:260 probability = 0.50000
#<freq> BB:260 => BB:265 probability = 0.50000
#<freq>
	.loc	1	227	0
	fldd	$1,1288($23)             	# [0]  id:1670 slave+0x0
	.loc	1	231	0
	addw	$21,2,$21                	# [0]  
	.loc	1	227	0
	fldd	$28,168($8)              	# [1]  id:1669 A_us+0x0
	fldd	$27,8($23)               	# [2]  id:1668 slave+0x0
	faddd	$28,$1,$28              	# [5]  
#<doc> $11 (328($23)) is a term here and is kept live to serve as the centre
#<doc> value of the second line-227 update further down.
	fldd	$11,328($23)             	# [6]  id:1667 slave+0x0
	faddd	$27,$28,$27             	# [12]  
	fldd	$25,160($23)             	# [13]  id:1666 slave+0x0
	faddd	$11,$27,$27             	# [19]  
	fldd	$24,176($23)             	# [20]  id:1665 slave+0x0
	faddd	$25,$27,$25             	# [26]  
	.loc	1	231	0
	fldd	$12,168($16)             	# [27]  id:1678 A_ds+0x0
	.loc	1	227	0
	faddd	$24,$25,$24             	# [33]  
	.loc	1	231	0
	fldd	$9,-1112($19)            	# [34]  id:1676 slave+0x0
	.loc	1	227	0
	fmuld	$24,$5,$24              	# [40]  
	.loc	1	231	0
	fldd	$3,-792($19)             	# [41]  id:1675 slave+0x0
	.loc	1	227	0
	fmad	$22,$4,$24,$22           	# [47]  
	.loc	1	231	0
	fldd	$2,-960($19)             	# [48]  id:1674 slave+0x0
	fldd	$1,-944($19)             	# [49]  id:1673 slave+0x0
	.loc	1	227	0
	fldd	$27,328($8)              	# [50]  id:1669 A_us+0x0
	.loc	1	231	0
	ldi	$8,320($8)                	# [50]  
	.loc	1	227	0
	fldd	$24,320($23)             	# [51]  id:1666 slave+0x0
#<doc> First line-227 result.
	fstd	$22,168($17)             	# [57]  id:1671 slave+0x0
	.loc	1	231	0
	fldd	$10,-2072($19)           	# [58]  id:1677 slave+0x0
	fldd	$28,-952($19)            	# [59]  id:1672 slave+0x0
	faddd	$10,$12,$10             	# [62]  
	.loc	1	227	0
	fldd	$22,488($23)             	# [63]  id:1667 slave+0x0
	.loc	1	231	0
	faddd	$9,$10,$9               	# [69]  
	.loc	1	227	0
	fldd	$12,336($23)             	# [70]  id:1665 slave+0x0
	.loc	1	231	0
	faddd	$3,$9,$3                	# [76]  
	fldd	$10,328($16)             	# [77]  id:1678 A_ds+0x0
	ldi	$16,320($16)              	# [77]  
	faddd	$2,$3,$2                	# [83]  
	faddd	$1,$2,$1                	# [90]  
	fldd	$2,-632($19)             	# [90]  id:1675 slave+0x0
	fmuld	$1,$5,$1                	# [97]  
	fmad	$28,$4,$1,$28            	# [104]  
	.loc	1	227	0
	fldd	$1,1448($23)             	# [104]  id:1670 slave+0x0
	faddd	$27,$1,$27              	# [108]  
	.loc	1	231	0
	fldd	$1,-800($19)             	# [108]  id:1674 slave+0x0
#<doc> First line-231 result.
	fstd	$28,-952($20)            	# [114]  id:1679 slave+0x0
	.loc	1	227	0
	fldd	$25,168($23)             	# [115]  id:1668 slave+0x0
	.loc	1	231	0
	ldi	$23,320($23)              	# [115]  
	fldd	$3,-952($19)             	# [116]  id:1676 slave+0x0
	.loc	1	227	0
	faddd	$25,$27,$25             	# [119]  
	.loc	1	231	0
	fldd	$28,-784($19)            	# [120]  id:1673 slave+0x0
	.loc	1	227	0
	faddd	$22,$25,$25             	# [126]  
	faddd	$24,$25,$24             	# [133]  
	.loc	1	231	0
#<doc> Exit flag, computed early: integer $25 = ($21 == $6). It shares its
#<doc> register number with the FP $25 consumed by the faddd just above.
	cmpeq	$21,$6,$25              	# [133]  
	.loc	1	227	0
	faddd	$12,$24,$12             	# [140]  
	fmuld	$12,$5,$12              	# [147]  
	fmad	$11,$4,$12,$11           	# [154]  
#<doc> Second line-227 result.
	fstd	$11,328($17)             	# [164]  id:1671 slave+0x0
	.loc	1	231	0
	ldi	$17,320($17)              	# [164]  
	fldd	$9,-1912($19)            	# [165]  id:1677 slave+0x0
	fldd	$27,-792($19)            	# [166]  id:1672 slave+0x0
	ldi	$19,320($19)              	# [166]  
	faddd	$9,$10,$9               	# [169]  
	faddd	$3,$9,$3                	# [176]  
	faddd	$2,$3,$2                	# [183]  
	faddd	$1,$2,$1                	# [190]  
	faddd	$28,$1,$28              	# [197]  
	fmuld	$28,$5,$28              	# [204]  
	fmad	$27,$4,$28,$27           	# [211]  
#<doc> Second line-231 result.
	fstd	$27,-792($20)            	# [221]  id:1679 slave+0x0
	ldi	$20,320($20)              	# [221]  
#<bpre> branch predict unknown
	beq	$25,.L_BB260_stencil_core 	# [222]  
#Block: 265 Pred: 260 Succ: 263 
.L_BB265_stencil_core:	# 0x1a68
#<loop> Part of loop body line 289, head labeled .Lt_1_254
#<freq>
#<freq> BB:265 frequency = 0.93600 (heuristic)
#<freq>
#Block: 263 Pred: 261 265 Succ: 259 
.L_BB263_stencil_core:	# 0x1a68
#<loop> Part of loop body line 289, head labeled .Lt_1_254
#<freq>
#<freq> BB:263 frequency = 0.00000 (heuristic)
#<freq>
#Block: 259 Pred: 263 Succ: 150 
.L_BB259_stencil_core:	# 0x1a68
#<loop> Part of loop body line 289, head labeled .Lt_1_254
#<freq>
#<freq> BB:259 frequency = 1.06971 (heuristic)
#<freq>
#Block: 150 Pred: 259 Succ: 151 147 
.L_BB150_stencil_core:	# 0x1a68
#<loop> Part of loop body line 289, head labeled .Lt_1_254
#<freq>
#<freq> BB:150 frequency = 1.06971 (heuristic)
#<freq> BB:150 => BB:151 probability = 0.50000
#<freq> BB:150 => BB:147 probability = 0.50000
#<freq>
# Latch of the loop headed by .Lt_1_254 (per the <loop> annotation above).
# Forms $25 = $13 + 1 and tests it against $7; the branch back to the loop
# head is taken while the two differ (cmpeq result in $2 is zero), otherwise
# control falls through to .Lt_1_250.
# $24 = $26 + 1 and $22 = $15 + 8 are also formed here; their consumers are
# not in this block -- presumably the loop head picks them up; verify there.
	addw	$13,1,$25                	# [0]  
	ldi	$24,1($26)                	# [0]  
	cmpeq	$25,$7,$2               	# [1]  
	ldi	$22,8($15)                	# [1]  
#<bpre> branch predict unknown
	beq	$2,.Lt_1_254              	# [2]  
#Block: 151 Pred: 150 139 Succ: 144 315 
.Lt_1_250:	# 0x1a7c
#<freq>
#<freq> BB:151 frequency = 0.56882 (heuristic)
#<freq> BB:151 => BB:144 probability = 0.84000
#<freq> BB:151 => BB:315 probability = 0.16000
#<freq>
# Straight-line block that performs eight separate point updates, attributed
# by the .loc directives to source lines 238, 243, 250, 257, 266, 271, 280
# and 289.  Instructions belonging to different source lines are interleaved.
#
# Every update has the same shape: six fldd values are chained together with
# faddd, the sum is scaled by FP $5 (fmuld), combined with a seventh loaded
# value and FP $4 by fmad, and the result is written back with fstd.
# NOTE(review): this matches the "alpha_d * centre + beta_d * (sum)" form of
# the C source quoted later in this file for lines 302/315, which would make
# $4 = alpha_d and $5 = beta_d and fmad a,b,c,d mean d = a*b + c -- confirm.
#
# Integer and FP instructions both spell registers "$N"; e.g. "$7" below is
# the base address of an fldd and also an faddd data operand.
# NOTE(review): presumably these are separate register files -- confirm
# against the SW3 assembler documentation.
#
# Addresses formed here are also saved with stl to 208($sp) and to the eight
# slots 320..376($sp); .L_BB158_stencil_core reloads the latter eight.
# The same instruction sequence appears again at .Lt_1_249; only the exit
# branch differs.
	.loc	1	238	0
	ldl	$21,424($sp)              	# [0]  gra_spill_temp_45
	ldl	$10,600($sp)              	# [1]  gra_spill_temp_67
	ldl	$27,584($sp)              	# [2]  gra_spill_temp_65
	ldl	$3,536($sp)               	# [3]  gra_spill_temp_59
	fldd	$28,1120($21)            	# [4]  id:1605 slave+0x0
	fldd	$26,0($10)               	# [5]  id:1606 A_us+0x0
	fldd	$25,0($27)               	# [6]  id:1604 A_ls+0x0
	faddd	$26,$28,$26             	# [9]  
	fldd	$24,160($21)             	# [10]  id:1603 slave+0x0
	faddd	$25,$26,$25             	# [16]  
	fldd	$23,0($3)                	# [17]  id:1602 A_fs+0x0
	faddd	$24,$25,$24             	# [23]  
	fldd	$22,8($21)               	# [24]  id:1601 slave+0x0
	faddd	$23,$24,$23             	# [30]  
	fldd	$21,0($21)               	# [31]  id:1600 slave+0x0
	faddd	$22,$23,$22             	# [37]  
	ldl	$20,272($sp)              	# [38]  gra_spill_temp_26
	fmuld	$22,$5,$22              	# [44]  
	.loc	1	243	0
	ldl	$26,664($sp)              	# [45]  gra_spill_temp_75
	.loc	1	238	0
	sll	$20,5,$20                 	# [48]  
	ldl	$16,712($sp)              	# [49]  gra_spill_temp_81
	s8subl	$20,$20,$20            	# [49]  
	.loc	1	243	0
	ldl	$13,720($sp)              	# [50]  gra_spill_temp_82
	.loc	1	238	0
	s8subl	$20,$20,$20            	# [50]  
	fmad	$21,$4,$22,$21           	# [51]  
	.loc	1	243	0
	ldl	$24,144($sp)              	# [51]  gra_spill_temp_10
	.loc	1	238	0
	s4addl	$20,$20,$20            	# [52]  
	.loc	1	243	0
	ldl	$23,528($sp)              	# [52]  gra_spill_temp_58
	.loc	1	238	0
	addl	$16,$20,$20              	# [53]  
	stl	$0,816($sp)               	# [53]  lgra_spill_temp_94
	.loc	1	243	0
	addl	$26,$13,$11              	# [54]  
	.loc	1	238	0
	stl	$20,208($sp)              	# [54]  gra_spill_temp_18
	.loc	1	243	0
	s8addl	$11,$16,$11            	# [55]  
	addl	$24,$10,$25              	# [55]  
	fldd	$18,-16($25)             	# [56]  id:1613 A_us+0x0
	fldd	$9,0($23)                	# [57]  id:1609 A_bs+0x0
	.loc	1	250	0
	ldl	$28,592($sp)              	# [58]  gra_spill_temp_66
	.loc	1	238	0
# Write-back of the source-line-238 result.
	fstd	$21,0($20)               	# [61]  id:1680 slave+0x0
	.loc	1	243	0
	fldd	$19,1104($11)            	# [62]  id:1614 slave+0x0
	fldd	$15,144($11)             	# [63]  id:1611 slave+0x0
	faddd	$18,$19,$18             	# [66]  
	addl	$24,$27,$19              	# [67]  
	fldd	$12,-24($11)             	# [67]  id:1610 slave+0x0
	fldd	$17,-16($19)             	# [68]  id:1612 A_ls+0x0
	fldd	$8,-16($11)              	# [69]  id:1608 slave+0x0
	faddd	$17,$18,$17             	# [73]  
	ldl	$18,704($sp)              	# [74]  gra_spill_temp_80
	faddd	$15,$17,$15             	# [80]  
	.loc	1	250	0
	ldl	$20,568($sp)              	# [81]  gra_spill_temp_63
	.loc	1	243	0
	addl	$26,$18,$17              	# [84]  
	.loc	1	250	0
	ldl	$21,136($sp)              	# [85]  gra_spill_temp_9
	.loc	1	243	0
	s8addl	$17,$16,$17            	# [85]  
	.loc	1	250	0
	fldd	$2,0($28)                	# [86]  id:1619 A_rs+0x0
	.loc	1	243	0
	faddd	$12,$15,$12             	# [87]  
	.loc	1	250	0
	sll	$20,5,$15                 	# [88]  
	.loc	1	243	0
	stl	$19,320($sp)              	# [88]  gra_spill_temp_32
	.loc	1	250	0
	s4addl	$15,$15,$15            	# [89]  
	addl	$21,$13,$0               	# [89]  
	s8addl	$0,$16,$0              	# [90]  
	addl	$15,$10,$7               	# [90]  
	fldd	$7,-160($7)              	# [91]  id:1621 A_us+0x0
	.loc	1	243	0
	faddd	$9,$12,$9               	# [94]  
	.loc	1	250	0
	addl	$21,$18,$12              	# [95]  
	stl	$0,328($sp)               	# [95]  gra_spill_temp_33
	s8addl	$12,$16,$12            	# [96]  
	.loc	1	243	0
	fmuld	$9,$5,$9                	# [101]  
	.loc	1	250	0
	stl	$12,344($sp)              	# [102]  gra_spill_temp_35
	.loc	1	243	0
	fmad	$8,$4,$9,$8              	# [108]  
# Write-back of the source-line-243 result.
	fstd	$8,-16($17)              	# [118]  id:1681 slave+0x0
	.loc	1	250	0
	fldd	$8,960($0)               	# [119]  id:1622 slave+0x0
	fldd	$6,-320($0)              	# [120]  id:1620 slave+0x0
	faddd	$7,$8,$7                	# [123]  
	fldd	$22,-152($0)             	# [124]  id:1617 slave+0x0
	faddd	$6,$7,$6                	# [130]  
	fldd	$19,-160($0)             	# [131]  id:1616 slave+0x0
	faddd	$2,$6,$2                	# [137]  
	s8addl	$20,$3,$6              	# [138]  
	fldd	$1,-8($6)                	# [139]  id:1618 A_fs+0x0
	stl	$6,336($sp)               	# [140]  gra_spill_temp_34
	faddd	$1,$2,$1                	# [144]  
	faddd	$22,$1,$22              	# [151]  
	.loc	1	257	0
	addl	$26,$21,$1               	# [151]  
	addl	$1,$13,$6                	# [152]  
	s8addl	$1,$10,$10             	# [152]  
	s8addl	$6,$16,$6              	# [153]  
	fldd	$10,-176($10)            	# [153]  id:1629 A_us+0x0
	stl	$6,352($sp)               	# [154]  gra_spill_temp_36
	.loc	1	250	0
	fmuld	$22,$5,$22              	# [158]  
	fmad	$19,$4,$22,$19           	# [165]  
	.loc	1	257	0
	addl	$1,$18,$22               	# [165]  
	s8addl	$22,$16,$22            	# [166]  
	.loc	1	250	0
# Write-back of the source-line-250 result.
	fstd	$19,-160($12)            	# [175]  id:1682 slave+0x0
	.loc	1	257	0
	fldd	$12,944($6)              	# [176]  id:1630 slave+0x0
	fldd	$9,-336($6)              	# [177]  id:1628 slave+0x0
	faddd	$10,$12,$10             	# [180]  
	fldd	$7,-184($6)              	# [181]  id:1626 slave+0x0
	faddd	$9,$10,$9               	# [187]  
	addl	$24,$28,$10              	# [188]  
	fldd	$0,-176($6)              	# [188]  id:1624 slave+0x0
	fldd	$8,-16($10)              	# [189]  id:1627 A_rs+0x0
	stl	$10,368($sp)              	# [190]  gra_spill_temp_38
	faddd	$8,$9,$8                	# [194]  
	.loc	1	266	0
	ldl	$10,560($sp)              	# [195]  gra_spill_temp_62
	.loc	1	257	0
	faddd	$7,$8,$7                	# [201]  
	s8addl	$20,$23,$8             	# [202]  
	stl	$22,360($sp)              	# [202]  gra_spill_temp_37
	fldd	$2,-8($8)                	# [203]  id:1625 A_bs+0x0
	.loc	1	266	0
	addl	$10,$13,$19              	# [205]  
	s8addl	$19,$16,$19            	# [206]  
	.loc	1	257	0
	stl	$8,376($sp)               	# [206]  gra_spill_temp_39
	.loc	1	280	0
	addl	$21,$10,$21              	# [207]  
	.loc	1	257	0
	faddd	$2,$7,$2                	# [209]  
	fmuld	$2,$5,$2                	# [216]  
	fmad	$0,$4,$2,$0              	# [223]  
	.loc	1	266	0
	ldl	$2,608($sp)               	# [223]  gra_spill_temp_68
	fldd	$6,0($2)                 	# [227]  id:1638 A_ds+0x0
	.loc	1	271	0
	addl	$24,$2,$24               	# [227]  
	.loc	1	280	0
	addl	$15,$2,$15               	# [228]  
	.loc	1	257	0
# Write-back of the source-line-257 result.
	fstd	$0,-176($22)             	# [233]  id:1683 slave+0x0
	.loc	1	266	0
	fldd	$0,-2240($19)            	# [234]  id:1637 slave+0x0
	fldd	$12,-960($19)            	# [235]  id:1635 slave+0x0
	faddd	$0,$6,$0                	# [238]  
	sll	$14,5,$6                  	# [239]  
	fldd	$8,-1112($19)            	# [239]  id:1633 slave+0x0
	s4addl	$6,$6,$6               	# [240]  
	fldd	$7,-1120($19)            	# [240]  id:1632 slave+0x0
	addl	$6,$27,$22               	# [241]  
	.loc	1	280	0
	fldd	$15,-160($15)            	# [241]  id:1654 A_ds+0x0
	.loc	1	266	0
	fldd	$22,-160($22)            	# [242]  id:1636 A_ls+0x0
	.loc	1	280	0
	addl	$6,$28,$6                	# [242]  
	fldd	$6,-160($6)              	# [243]  id:1651 A_rs+0x0
	.loc	1	266	0
	faddd	$22,$0,$22              	# [246]  
	s4subl	$14,$14,$0             	# [247]  
	faddd	$12,$22,$12             	# [253]  
	sll	$0,4,$0                   	# [254]  
	addl	$10,$18,$22              	# [254]  
	s8addl	$14,$0,$0              	# [255]  
	s8addl	$22,$16,$22            	# [255]  
	addl	$0,$3,$9                 	# [256]  
	.loc	1	271	0
	addl	$0,$23,$0                	# [256]  
	.loc	1	266	0
	fldd	$9,-56($9)               	# [257]  id:1634 A_fs+0x0
	.loc	1	271	0
	fldd	$0,-56($0)               	# [258]  id:1641 A_bs+0x0
	.loc	1	266	0
	faddd	$9,$12,$9               	# [261]  
	.loc	1	271	0
	addl	$26,$10,$12              	# [262]  
	.loc	1	289	0
	addl	$1,$10,$10               	# [262]  
	s8addl	$1,$2,$1               	# [263]  
	.loc	1	266	0
	faddd	$8,$9,$8                	# [268]  
	.loc	1	271	0
	fldd	$9,-16($24)              	# [269]  id:1646 A_ds+0x0
	.loc	1	266	0
	fmuld	$8,$5,$8                	# [275]  
	.loc	1	289	0
	fldd	$1,-176($1)              	# [276]  id:1662 A_ds+0x0
	.loc	1	266	0
	fmad	$7,$4,$8,$7              	# [282]  
	.loc	1	271	0
	addl	$12,$13,$8               	# [283]  
	addl	$12,$18,$12              	# [283]  
	s8addl	$8,$16,$8              	# [284]  
	s8addl	$12,$16,$12            	# [284]  
	.loc	1	266	0
# Write-back of the source-line-266 result.
	fstd	$7,-1120($22)            	# [292]  id:1684 slave+0x0
	.loc	1	271	0
	fldd	$7,-2256($8)             	# [293]  id:1645 slave+0x0
	faddd	$7,$9,$7                	# [297]  
	ldl	$9,152($sp)               	# [297]  gra_spill_temp_11
	addl	$26,$9,$26               	# [301]  
	fldd	$9,-976($8)              	# [301]  id:1643 slave+0x0
	s8addl	$26,$27,$27            	# [302]  
	.loc	1	289	0
	s8addl	$26,$28,$26            	# [302]  
	.loc	1	271	0
	fldd	$27,-176($27)            	# [303]  id:1644 A_ls+0x0
	.loc	1	289	0
	fldd	$26,-176($26)            	# [304]  id:1659 A_rs+0x0
	.loc	1	271	0
	faddd	$27,$7,$27              	# [307]  
	fldd	$7,-1144($8)             	# [308]  id:1642 slave+0x0
	faddd	$9,$27,$9               	# [314]  
	fldd	$27,-1136($8)            	# [315]  id:1640 slave+0x0
	faddd	$7,$9,$7                	# [321]  
	faddd	$0,$7,$0                	# [328]  
	fmuld	$0,$5,$0                	# [335]  
	fmad	$27,$4,$0,$27            	# [342]  
# Write-back of the source-line-271 result.
	fstd	$27,-1136($12)           	# [352]  id:1685 slave+0x0
	.loc	1	280	0
	addl	$21,$13,$27              	# [352]  
	s8addl	$27,$16,$27            	# [353]  
	addl	$21,$18,$21              	# [353]  
	fldd	$9,-2400($27)            	# [354]  id:1653 slave+0x0
	s8addl	$21,$16,$21            	# [354]  
	fldd	$7,-1440($27)            	# [355]  id:1652 slave+0x0
	.loc	1	289	0
	addl	$10,$13,$13              	# [355]  
	.loc	1	280	0
	fldd	$0,-1272($27)            	# [356]  id:1649 slave+0x0
	.loc	1	289	0
	s8addl	$13,$16,$13            	# [356]  
	.loc	1	280	0
	fldd	$27,-1280($27)           	# [357]  id:1648 slave+0x0
	.loc	1	289	0
	addl	$10,$18,$10              	# [357]  
	.loc	1	280	0
	faddd	$9,$15,$9               	# [358]  
	s8subl	$14,$14,$15            	# [358]  
	addl	$20,$15,$20              	# [359]  
	.loc	1	289	0
	s8addl	$10,$16,$10            	# [359]  
	.loc	1	280	0
	s8addl	$20,$3,$3              	# [360]  
	.loc	1	289	0
	s8addl	$20,$23,$20            	# [360]  
	.loc	1	280	0
	fldd	$3,-64($3)               	# [361]  id:1650 A_fs+0x0
	faddd	$7,$9,$7                	# [365]  
	.loc	1	289	0
	fldd	$20,-64($20)             	# [366]  id:1657 A_bs+0x0
	.loc	1	280	0
	faddd	$6,$7,$6                	# [372]  
	.loc	1	289	0
# $9 loaded here is the value tested by the exit branch at the end of the block.
	ldl	$9,632($sp)               	# [373]  gra_spill_temp_71
	.loc	1	280	0
	faddd	$3,$6,$3                	# [379]  
	faddd	$0,$3,$0                	# [386]  
	fmuld	$0,$5,$0                	# [393]  
	fmad	$27,$4,$0,$27            	# [400]  
# Write-back of the source-line-280 result.
	fstd	$27,-1280($21)           	# [410]  id:1686 slave+0x0
	.loc	1	289	0
	fldd	$0,-2416($13)            	# [411]  id:1661 slave+0x0
	fldd	$27,-1456($13)           	# [412]  id:1660 slave+0x0
	faddd	$0,$1,$0                	# [415]  
	fldd	$21,-1304($13)           	# [416]  id:1658 slave+0x0
	faddd	$27,$0,$27              	# [422]  
	fldd	$13,-1296($13)           	# [423]  id:1656 slave+0x0
	faddd	$26,$27,$26             	# [429]  
	faddd	$21,$26,$21             	# [436]  
	faddd	$20,$21,$20             	# [443]  
	fmuld	$20,$5,$20              	# [450]  
	fmad	$13,$4,$20,$13           	# [457]  
# Write-back of the source-line-289 result.
	fstd	$13,-1296($10)           	# [467]  id:1687 slave+0x0
# Exit: logically "bne $9,.Lt_1_312".  The unconditional br skips over a
# one-instruction trampoline; the bne then targets that trampoline, which in
# turn jumps to .Lt_1_312.  When $9 is zero control falls through to BB315.
# NOTE(review): presumably emitted so the conditional branch points backwards
# for the "predict taken" hint below -- confirm against compiler docs.
#<bpre> branch predict taken
	br .Lt_1_250.bpre1
.Lt_1_312.bpre.Lt_1_250:
	br .Lt_1_312
.Lt_1_250.bpre1:
	bne	$9,.Lt_1_312.bpre.Lt_1_250 	# [468]  
#Block: 315 Pred: 151 Succ: 157 
.L_BB315_stencil_core:	# 0x1dd4
#<freq>
#<freq> BB:315 frequency = 0.09101 (heuristic)
#<freq>
# Fall-through exit of .Lt_1_250 (taken when its final bne is not): jump
# straight to .Lt_1_260, bypassing .Lt_1_312 and the .Lt_1_264 loop.
# NOTE(review): $31 as the br link operand presumably discards the return
# address (zero register) -- confirm.
	br	$31,.Lt_1_260              	# [0]  
#Block: 141 Pred: 130 Succ: 143 139 
.Lt_1_237:	# 0x1dd8
#<freq>
#<freq> BB:141 frequency = 0.05970 (heuristic)
#<freq> BB:141 => BB:143 probability = 0.13483
#<freq> BB:141 => BB:139 probability = 0.86517
#<freq>
# Reloads spill slot 576($sp) into $1 and stores $31 into spill slot
# 696($sp); if $1 is non-zero control goes to .Lt_1_311 (defined outside this
# part of the file), otherwise it falls through to .Lt_1_249.
# NOTE(review): the stl of $31 presumably zeroes gra_spill_temp_79 -- confirm
# that $31 is the zero register on this target.
	.loc	1	231	0
	ldl	$1,576($sp)               	# [0]  gra_spill_temp_64
	stl	$31,696($sp)              	# [1]  gra_spill_temp_79
#<bpre> branch predict taken
	bne	$1,.Lt_1_311              	# [4]  
#Block: 143 Pred: 138 141 Succ: 144 157 
.Lt_1_331:	# 0x1de4
.Lt_1_249:	# 0x1de4
#<freq>
#<freq> BB:143 frequency = 0.43118 (heuristic)
#<freq> BB:143 => BB:144 probability = 0.92799
#<freq> BB:143 => BB:157 probability = 0.07201
#<freq>
# Straight-line block that performs eight separate point updates, attributed
# by the .loc directives to source lines 238, 243, 250, 257, 266, 271, 280
# and 289.  Instructions belonging to different source lines are interleaved.
# The instruction sequence is the same as the one at .Lt_1_250 earlier in the
# file; only the exit differs (a single beq here).
#
# Every update has the same shape: six fldd values are chained together with
# faddd, the sum is scaled by FP $5 (fmuld), combined with a seventh loaded
# value and FP $4 by fmad, and the result is written back with fstd.
# NOTE(review): this matches the "alpha_d * centre + beta_d * (sum)" form of
# the C source quoted later in this file for lines 302/315, which would make
# $4 = alpha_d and $5 = beta_d and fmad a,b,c,d mean d = a*b + c -- confirm.
#
# Integer and FP instructions both spell registers "$N"; e.g. "$7" below is
# the base address of an fldd and also an faddd data operand.
# NOTE(review): presumably these are separate register files -- confirm
# against the SW3 assembler documentation.
#
# Addresses formed here are also saved with stl to 208($sp) and to the eight
# slots 320..376($sp); .L_BB158_stencil_core reloads the latter eight.
	.loc	1	238	0
	ldl	$21,424($sp)              	# [0]  gra_spill_temp_45
	ldl	$10,600($sp)              	# [1]  gra_spill_temp_67
	ldl	$27,584($sp)              	# [2]  gra_spill_temp_65
	ldl	$3,536($sp)               	# [3]  gra_spill_temp_59
	fldd	$28,1120($21)            	# [4]  id:1605 slave+0x0
	fldd	$26,0($10)               	# [5]  id:1606 A_us+0x0
	fldd	$25,0($27)               	# [6]  id:1604 A_ls+0x0
	faddd	$26,$28,$26             	# [9]  
	fldd	$24,160($21)             	# [10]  id:1603 slave+0x0
	faddd	$25,$26,$25             	# [16]  
	fldd	$23,0($3)                	# [17]  id:1602 A_fs+0x0
	faddd	$24,$25,$24             	# [23]  
	fldd	$22,8($21)               	# [24]  id:1601 slave+0x0
	faddd	$23,$24,$23             	# [30]  
	fldd	$21,0($21)               	# [31]  id:1600 slave+0x0
	faddd	$22,$23,$22             	# [37]  
	ldl	$20,272($sp)              	# [38]  gra_spill_temp_26
	fmuld	$22,$5,$22              	# [44]  
	.loc	1	243	0
	ldl	$26,664($sp)              	# [45]  gra_spill_temp_75
	.loc	1	238	0
	sll	$20,5,$20                 	# [48]  
	ldl	$16,712($sp)              	# [49]  gra_spill_temp_81
	s8subl	$20,$20,$20            	# [49]  
	.loc	1	243	0
	ldl	$13,720($sp)              	# [50]  gra_spill_temp_82
	.loc	1	238	0
	s8subl	$20,$20,$20            	# [50]  
	fmad	$21,$4,$22,$21           	# [51]  
	.loc	1	243	0
	ldl	$24,144($sp)              	# [51]  gra_spill_temp_10
	.loc	1	238	0
	s4addl	$20,$20,$20            	# [52]  
	.loc	1	243	0
	ldl	$23,528($sp)              	# [52]  gra_spill_temp_58
	.loc	1	238	0
	addl	$16,$20,$20              	# [53]  
	stl	$0,816($sp)               	# [53]  lgra_spill_temp_94
	.loc	1	243	0
	addl	$26,$13,$11              	# [54]  
	.loc	1	238	0
	stl	$20,208($sp)              	# [54]  gra_spill_temp_18
	.loc	1	243	0
	s8addl	$11,$16,$11            	# [55]  
	addl	$24,$10,$25              	# [55]  
	fldd	$18,-16($25)             	# [56]  id:1613 A_us+0x0
	fldd	$9,0($23)                	# [57]  id:1609 A_bs+0x0
	.loc	1	250	0
	ldl	$28,592($sp)              	# [58]  gra_spill_temp_66
	.loc	1	238	0
# Write-back of the source-line-238 result.
	fstd	$21,0($20)               	# [61]  id:1607 slave+0x0
	.loc	1	243	0
	fldd	$19,1104($11)            	# [62]  id:1614 slave+0x0
	fldd	$15,144($11)             	# [63]  id:1611 slave+0x0
	faddd	$18,$19,$18             	# [66]  
	addl	$24,$27,$19              	# [67]  
	fldd	$12,-24($11)             	# [67]  id:1610 slave+0x0
	fldd	$17,-16($19)             	# [68]  id:1612 A_ls+0x0
	fldd	$8,-16($11)              	# [69]  id:1608 slave+0x0
	faddd	$17,$18,$17             	# [73]  
	ldl	$18,704($sp)              	# [74]  gra_spill_temp_80
	faddd	$15,$17,$15             	# [80]  
	.loc	1	250	0
	ldl	$20,568($sp)              	# [81]  gra_spill_temp_63
	.loc	1	243	0
	addl	$26,$18,$17              	# [84]  
	.loc	1	250	0
	ldl	$21,136($sp)              	# [85]  gra_spill_temp_9
	.loc	1	243	0
	s8addl	$17,$16,$17            	# [85]  
	.loc	1	250	0
	fldd	$2,0($28)                	# [86]  id:1619 A_rs+0x0
	.loc	1	243	0
	faddd	$12,$15,$12             	# [87]  
	.loc	1	250	0
	sll	$20,5,$15                 	# [88]  
	.loc	1	243	0
	stl	$19,320($sp)              	# [88]  gra_spill_temp_32
	.loc	1	250	0
	s4addl	$15,$15,$15            	# [89]  
	addl	$21,$13,$0               	# [89]  
	s8addl	$0,$16,$0              	# [90]  
	addl	$15,$10,$7               	# [90]  
	fldd	$7,-160($7)              	# [91]  id:1621 A_us+0x0
	.loc	1	243	0
	faddd	$9,$12,$9               	# [94]  
	.loc	1	250	0
	addl	$21,$18,$12              	# [95]  
	stl	$0,328($sp)               	# [95]  gra_spill_temp_33
	s8addl	$12,$16,$12            	# [96]  
	.loc	1	243	0
	fmuld	$9,$5,$9                	# [101]  
	.loc	1	250	0
	stl	$12,344($sp)              	# [102]  gra_spill_temp_35
	.loc	1	243	0
	fmad	$8,$4,$9,$8              	# [108]  
# Write-back of the source-line-243 result.
	fstd	$8,-16($17)              	# [118]  id:1615 slave+0x0
	.loc	1	250	0
	fldd	$8,960($0)               	# [119]  id:1622 slave+0x0
	fldd	$6,-320($0)              	# [120]  id:1620 slave+0x0
	faddd	$7,$8,$7                	# [123]  
	fldd	$22,-152($0)             	# [124]  id:1617 slave+0x0
	faddd	$6,$7,$6                	# [130]  
	fldd	$19,-160($0)             	# [131]  id:1616 slave+0x0
	faddd	$2,$6,$2                	# [137]  
	s8addl	$20,$3,$6              	# [138]  
	fldd	$1,-8($6)                	# [139]  id:1618 A_fs+0x0
	stl	$6,336($sp)               	# [140]  gra_spill_temp_34
	faddd	$1,$2,$1                	# [144]  
	faddd	$22,$1,$22              	# [151]  
	.loc	1	257	0
	addl	$26,$21,$1               	# [151]  
	addl	$1,$13,$6                	# [152]  
	s8addl	$1,$10,$10             	# [152]  
	s8addl	$6,$16,$6              	# [153]  
	fldd	$10,-176($10)            	# [153]  id:1629 A_us+0x0
	stl	$6,352($sp)               	# [154]  gra_spill_temp_36
	.loc	1	250	0
	fmuld	$22,$5,$22              	# [158]  
	fmad	$19,$4,$22,$19           	# [165]  
	.loc	1	257	0
	addl	$1,$18,$22               	# [165]  
	s8addl	$22,$16,$22            	# [166]  
	.loc	1	250	0
# Write-back of the source-line-250 result.
	fstd	$19,-160($12)            	# [175]  id:1623 slave+0x0
	.loc	1	257	0
	fldd	$12,944($6)              	# [176]  id:1630 slave+0x0
	fldd	$9,-336($6)              	# [177]  id:1628 slave+0x0
	faddd	$10,$12,$10             	# [180]  
	fldd	$7,-184($6)              	# [181]  id:1626 slave+0x0
	faddd	$9,$10,$9               	# [187]  
	addl	$24,$28,$10              	# [188]  
	fldd	$0,-176($6)              	# [188]  id:1624 slave+0x0
	fldd	$8,-16($10)              	# [189]  id:1627 A_rs+0x0
	stl	$10,368($sp)              	# [190]  gra_spill_temp_38
	faddd	$8,$9,$8                	# [194]  
	.loc	1	266	0
	ldl	$10,560($sp)              	# [195]  gra_spill_temp_62
	.loc	1	257	0
	faddd	$7,$8,$7                	# [201]  
	s8addl	$20,$23,$8             	# [202]  
	stl	$22,360($sp)              	# [202]  gra_spill_temp_37
	fldd	$2,-8($8)                	# [203]  id:1625 A_bs+0x0
	.loc	1	266	0
	addl	$10,$13,$19              	# [205]  
	s8addl	$19,$16,$19            	# [206]  
	.loc	1	257	0
	stl	$8,376($sp)               	# [206]  gra_spill_temp_39
	.loc	1	280	0
	addl	$21,$10,$21              	# [207]  
	.loc	1	257	0
	faddd	$2,$7,$2                	# [209]  
	fmuld	$2,$5,$2                	# [216]  
	fmad	$0,$4,$2,$0              	# [223]  
	.loc	1	266	0
	ldl	$2,608($sp)               	# [223]  gra_spill_temp_68
	fldd	$6,0($2)                 	# [227]  id:1638 A_ds+0x0
	.loc	1	271	0
	addl	$24,$2,$24               	# [227]  
	.loc	1	280	0
	addl	$15,$2,$15               	# [228]  
	.loc	1	257	0
# Write-back of the source-line-257 result.
	fstd	$0,-176($22)             	# [233]  id:1631 slave+0x0
	.loc	1	266	0
	fldd	$0,-2240($19)            	# [234]  id:1637 slave+0x0
	fldd	$12,-960($19)            	# [235]  id:1635 slave+0x0
	faddd	$0,$6,$0                	# [238]  
	sll	$14,5,$6                  	# [239]  
	fldd	$8,-1112($19)            	# [239]  id:1633 slave+0x0
	s4addl	$6,$6,$6               	# [240]  
	fldd	$7,-1120($19)            	# [240]  id:1632 slave+0x0
	addl	$6,$27,$22               	# [241]  
	.loc	1	280	0
	fldd	$15,-160($15)            	# [241]  id:1654 A_ds+0x0
	.loc	1	266	0
	fldd	$22,-160($22)            	# [242]  id:1636 A_ls+0x0
	.loc	1	280	0
	addl	$6,$28,$6                	# [242]  
	fldd	$6,-160($6)              	# [243]  id:1651 A_rs+0x0
	.loc	1	266	0
	faddd	$22,$0,$22              	# [246]  
	s4subl	$14,$14,$0             	# [247]  
	faddd	$12,$22,$12             	# [253]  
	sll	$0,4,$0                   	# [254]  
	addl	$10,$18,$22              	# [254]  
	s8addl	$14,$0,$0              	# [255]  
	s8addl	$22,$16,$22            	# [255]  
	addl	$0,$3,$9                 	# [256]  
	.loc	1	271	0
	addl	$0,$23,$0                	# [256]  
	.loc	1	266	0
	fldd	$9,-56($9)               	# [257]  id:1634 A_fs+0x0
	.loc	1	271	0
	fldd	$0,-56($0)               	# [258]  id:1641 A_bs+0x0
	.loc	1	266	0
	faddd	$9,$12,$9               	# [261]  
	.loc	1	271	0
	addl	$26,$10,$12              	# [262]  
	.loc	1	289	0
	addl	$1,$10,$10               	# [262]  
	s8addl	$1,$2,$1               	# [263]  
	.loc	1	266	0
	faddd	$8,$9,$8                	# [268]  
	.loc	1	271	0
	fldd	$9,-16($24)              	# [269]  id:1646 A_ds+0x0
	.loc	1	266	0
	fmuld	$8,$5,$8                	# [275]  
	.loc	1	289	0
	fldd	$1,-176($1)              	# [276]  id:1662 A_ds+0x0
	.loc	1	266	0
	fmad	$7,$4,$8,$7              	# [282]  
	.loc	1	271	0
	addl	$12,$13,$8               	# [283]  
	addl	$12,$18,$12              	# [283]  
	s8addl	$8,$16,$8              	# [284]  
	s8addl	$12,$16,$12            	# [284]  
	.loc	1	266	0
# Write-back of the source-line-266 result.
	fstd	$7,-1120($22)            	# [292]  id:1639 slave+0x0
	.loc	1	271	0
	fldd	$7,-2256($8)             	# [293]  id:1645 slave+0x0
	faddd	$7,$9,$7                	# [297]  
	ldl	$9,152($sp)               	# [297]  gra_spill_temp_11
	addl	$26,$9,$26               	# [301]  
	fldd	$9,-976($8)              	# [301]  id:1643 slave+0x0
	s8addl	$26,$27,$27            	# [302]  
	.loc	1	289	0
	s8addl	$26,$28,$26            	# [302]  
	.loc	1	271	0
	fldd	$27,-176($27)            	# [303]  id:1644 A_ls+0x0
	.loc	1	289	0
	fldd	$26,-176($26)            	# [304]  id:1659 A_rs+0x0
	.loc	1	271	0
	faddd	$27,$7,$27              	# [307]  
	fldd	$7,-1144($8)             	# [308]  id:1642 slave+0x0
	faddd	$9,$27,$9               	# [314]  
	fldd	$27,-1136($8)            	# [315]  id:1640 slave+0x0
	faddd	$7,$9,$7                	# [321]  
	faddd	$0,$7,$0                	# [328]  
	fmuld	$0,$5,$0                	# [335]  
	fmad	$27,$4,$0,$27            	# [342]  
# Write-back of the source-line-271 result.
	fstd	$27,-1136($12)           	# [352]  id:1647 slave+0x0
	.loc	1	280	0
	addl	$21,$13,$27              	# [352]  
	s8addl	$27,$16,$27            	# [353]  
	addl	$21,$18,$21              	# [353]  
	fldd	$9,-2400($27)            	# [354]  id:1653 slave+0x0
	s8addl	$21,$16,$21            	# [354]  
	fldd	$7,-1440($27)            	# [355]  id:1652 slave+0x0
	.loc	1	289	0
	addl	$10,$13,$13              	# [355]  
	.loc	1	280	0
	fldd	$0,-1272($27)            	# [356]  id:1649 slave+0x0
	.loc	1	289	0
	s8addl	$13,$16,$13            	# [356]  
	.loc	1	280	0
	fldd	$27,-1280($27)           	# [357]  id:1648 slave+0x0
	.loc	1	289	0
	addl	$10,$18,$10              	# [357]  
	.loc	1	280	0
	faddd	$9,$15,$9               	# [358]  
	s8subl	$14,$14,$15            	# [358]  
	addl	$20,$15,$20              	# [359]  
	.loc	1	289	0
	s8addl	$10,$16,$10            	# [359]  
	.loc	1	280	0
	s8addl	$20,$3,$3              	# [360]  
	.loc	1	289	0
	s8addl	$20,$23,$20            	# [360]  
	.loc	1	280	0
	fldd	$3,-64($3)               	# [361]  id:1650 A_fs+0x0
	faddd	$7,$9,$7                	# [365]  
	.loc	1	289	0
	fldd	$20,-64($20)             	# [366]  id:1657 A_bs+0x0
	.loc	1	280	0
	faddd	$6,$7,$6                	# [372]  
	.loc	1	289	0
# $9 loaded here is the value tested by the exit branch at the end of the block.
	ldl	$9,632($sp)               	# [373]  gra_spill_temp_71
	.loc	1	280	0
	faddd	$3,$6,$3                	# [379]  
	faddd	$0,$3,$0                	# [386]  
	fmuld	$0,$5,$0                	# [393]  
	fmad	$27,$4,$0,$27            	# [400]  
# Write-back of the source-line-280 result.
	fstd	$27,-1280($21)           	# [410]  id:1655 slave+0x0
	.loc	1	289	0
	fldd	$0,-2416($13)            	# [411]  id:1661 slave+0x0
	fldd	$27,-1456($13)           	# [412]  id:1660 slave+0x0
	faddd	$0,$1,$0                	# [415]  
	fldd	$21,-1304($13)           	# [416]  id:1658 slave+0x0
	faddd	$27,$0,$27              	# [422]  
	fldd	$13,-1296($13)           	# [423]  id:1656 slave+0x0
	faddd	$26,$27,$26             	# [429]  
	faddd	$21,$26,$21             	# [436]  
	faddd	$20,$21,$20             	# [443]  
	fmuld	$20,$5,$20              	# [450]  
	fmad	$13,$4,$20,$13           	# [457]  
# Write-back of the source-line-289 result.
	fstd	$13,-1296($10)           	# [467]  id:1663 slave+0x0
# Exit: when $9 (reloaded from 632($sp) above) is zero, skip to .Lt_1_260;
# otherwise fall through into .Lt_1_312, the preheader of the .Lt_1_264 loop.
#<bpre> branch predict not taken
	beq	$9,.Lt_1_260              	# [468]  
#Block: 144 Pred: 143 151 Succ: 266 
.Lt_1_312:	# 0x213c
#<freq>
#<freq> BB:144 frequency = 0.87794 (heuristic)
#<freq>
# Preheader for the .Lt_1_264 loop: reloads spilled values and sets up the
# registers the loop advances each iteration.
# NOTE(review): the arithmetic below reads s8addl a,b,c as c = 8*a + b --
# confirm against the SW3 ISA manual.
#   $7  = 8*[720($sp)] + [712($sp)]     $27 = 8*[704($sp)] + [712($sp)]
#   $23 = 8*$15 + [536($sp)]            $16 = 8*$15 + [528($sp)]
#   $21 = $11, $20 = $17                (copies advanced inside the loop)
#   $10 = $31                           (loop counter start; written only
#                                        after $10 has served as the base
#                                        for $7 and $27)
#   $6  = [568($sp)] - 2                (value the counter is compared with)
#   $9, $28, $18, $13 = reloads of 536, 528, 600, 608($sp)
	ldl	$7,720($sp)               	# [0]  gra_spill_temp_82
	mov	$11,$21                   	# [0]  
	ldl	$10,712($sp)              	# [1]  gra_spill_temp_81
	mov	$17,$20                   	# [1]  
	ldl	$27,704($sp)              	# [2]  gra_spill_temp_80
	s8addl	$7,$10,$7              	# [5]  
	ldl	$9,536($sp)               	# [6]  gra_spill_temp_59
	s8addl	$27,$10,$27            	# [9]  
	ldl	$28,528($sp)              	# [10]  gra_spill_temp_58
	mov	$31,$10                   	# [10]  
	ldl	$6,568($sp)               	# [11]  gra_spill_temp_63
	s8addl	$15,$9,$23             	# [13]  
	ldl	$18,600($sp)              	# [14]  gra_spill_temp_67
	s8addl	$15,$28,$16            	# [14]  
	ldl	$13,608($sp)              	# [15]  gra_spill_temp_68
	subw	$6,2,$6                  	# [17]  
#Block: 266 Pred: 144 Succ: 156 
.L_BB266_stencil_core:	# 0x217c
#<freq>
#<freq> BB:266 frequency = 0.87794 (heuristic)
#<freq>
	.loc	1	302	0
# 298    //10.1 compute up and down line of j dimensional  change 
# 299    for(j = 1;j < j_region; ++j)
# 300    {
# 301    //front face
# 302      slave[lhs_no][0][j][0] = alpha_d * slave[rhs_no][0][j][0] + \
# Last step before entering the .Lt_1_264 loop.
# The fldd preloads FP $15 from 160($7); the loop's first instruction pair
# copies $15 into $2, which is the operand its first fmad multiplies by $4.
# The two stl instructions save integer $17 and $11 to the stack; they are
# reloaded in .L_BB267_stencil_core after the loop (the loop's cmpeq writes
# integer $11).
	fldd	$15,160($7)              	# [0]  
	stl	$17,800($sp)              	# [1]  gra_spill_temp_92
	stl	$11,792($sp)              	# [2]  gra_spill_temp_91
#Block: 156 Pred: 156 266 Succ: 267 156 
	.align	4
.Lt_1_264:	# 0x2188
#<loop> Loop body line 289, nesting depth: 1, estimated iterations: 5
#<freq>
#<freq> BB:156 frequency = 4.38969 (heuristic)
#<freq> BB:156 => BB:267 probability = 0.20000
#<freq> BB:156 => BB:156 probability = 0.80000
#<freq>
# Loop body: each iteration performs four point updates, attributed by the
# .loc directives to source lines 302, 306, 311 and 315.  Each one adds six
# loaded values, scales the sum by FP $5, combines it with a seventh value
# and FP $4 via fmad, and stores the result:
#   line 302 -> fstd 160($27)      line 306 -> fstd -960($22)
#   line 311 -> fstd 144($20)      line 315 -> fstd -976($12)
# NOTE(review): per the C source quoted below this is
# alpha_d * centre + beta_d * (sum), i.e. presumably $4 = alpha_d and
# $5 = beta_d, with fmad a,b,c,d meaning d = a*b + c -- confirm.
#
# Per-iteration pointer bumps (ldi): +160 bytes on $18 $7 $13 $27 $19 $25
# $22 $21 $24 $20 $8 $12, and +8 bytes on $9 $23 $28 $16.
# Counter: $10 += 1 (addw); the loop repeats while $10 != $6 (cmpeq result
# in integer $11 is zero, so the closing beq is taken).
#
# NOTE(review): "mov $15,$2" must act on the FP registers for the data flow
# to work: FP $15 is loaded from 320($7) in this iteration (or preloaded from
# 160($7) before the loop) and FP $2 is the value the first fmad multiplies
# by $4.  The mnemonic itself does not show the register file -- verify how
# the assembler encodes it.
	fldd	$1,1280($7)              	# [0]  id:1694 slave+0x0
	mov	$15,$2                    	# [0]  
	fldd	$26,160($18)             	# [1]  id:1693 A_us+0x0
	.loc	1	315	0
# 311      slave[lhs_no][0][j][k_region] = alpha_d * slave[rhs_no][0][j][k_region] + \
# 312                       beta_d * (A_us[j][k_region] + slave[rhs_no][1][j][k_region] +\
# 313                       slave[rhs_no][0][j-1][k_region] + slave[rhs_no][0][j+1][k_region]+\
# 314                       slave[rhs_no][0][j][k_k] + A_bs[0][j]);
# 315      slave[lhs_no][i_region][j][k_region] =  alpha_d * slave[rhs_no][i_region][j][k_region] + \
	addw	$10,1,$10                	# [1]  
	.loc	1	302	0
	fldd	$17,0($7)                	# [2]  id:1692 slave+0x0
	.loc	1	315	0
	ldi	$18,160($18)              	# [2]  
	.loc	1	302	0
# This load is both an addend of the current line-302 sum and the value the
# next iteration copies into $2.
	fldd	$15,320($7)              	# [3]  id:1691 slave+0x0
	faddd	$26,$1,$26              	# [5]  
	fldd	$11,8($9)                	# [6]  id:1690 A_fs+0x0
	.loc	1	315	0
	ldi	$9,8($9)                  	# [6]  
	.loc	1	302	0
	fldd	$3,168($7)               	# [7]  id:1689 slave+0x0
	.loc	1	315	0
	ldi	$7,160($7)                	# [7]  
	.loc	1	306	0
	fldd	$1,160($13)              	# [8]  id:1702 A_ds+0x0
	.loc	1	315	0
	ldi	$13,160($13)              	# [8]  
	.loc	1	302	0
	faddd	$17,$26,$17             	# [12]  
	faddd	$15,$17,$17             	# [19]  
	faddd	$11,$17,$11             	# [26]  
	.loc	1	306	0
	fldd	$17,-1120($19)           	# [26]  id:1700 slave+0x0
	.loc	1	302	0
	faddd	$3,$11,$3               	# [33]  
	.loc	1	306	0
	fldd	$11,-800($19)            	# [33]  id:1699 slave+0x0
	.loc	1	302	0
	fmuld	$3,$5,$3                	# [40]  
	fmad	$2,$4,$3,$2              	# [47]  
	.loc	1	306	0
	fldd	$3,-48($23)              	# [47]  id:1698 A_fs+0x0
	.loc	1	315	0
	ldi	$23,8($23)                	# [48]  
	.loc	1	302	0
# Write-back of the source-line-302 result.
	fstd	$2,160($27)              	# [57]  id:1695 slave+0x0
	.loc	1	306	0
	fldd	$26,-2080($19)           	# [58]  id:1701 slave+0x0
	.loc	1	315	0
	ldi	$27,160($27)              	# [58]  
	.loc	1	306	0
	fldd	$2,-952($19)             	# [59]  id:1697 slave+0x0
	faddd	$26,$1,$26              	# [62]  
	fldd	$1,-960($19)             	# [63]  id:1696 slave+0x0
	.loc	1	315	0
	ldi	$19,160($19)              	# [63]  
	.loc	1	306	0
	faddd	$17,$26,$17             	# [69]  
	faddd	$11,$17,$11             	# [76]  
	.loc	1	311	0
	fldd	$17,144($25)             	# [76]  id:1709 A_us+0x0
	.loc	1	315	0
	ldi	$25,160($25)              	# [77]  
	.loc	1	306	0
	faddd	$3,$11,$3               	# [83]  
	.loc	1	311	0
	fldd	$11,-16($21)             	# [84]  id:1708 slave+0x0
	.loc	1	306	0
	faddd	$2,$3,$2                	# [90]  
	.loc	1	311	0
	fldd	$3,304($21)              	# [91]  id:1707 slave+0x0
	.loc	1	306	0
	fmuld	$2,$5,$2                	# [97]  
	fmad	$1,$4,$2,$1              	# [104]  
# Write-back of the source-line-306 result.
	fstd	$1,-960($22)             	# [114]  id:1703 slave+0x0
	.loc	1	315	0
	ldi	$22,160($22)              	# [114]  
	.loc	1	311	0
	fldd	$26,1264($21)            	# [115]  id:1710 slave+0x0
	fldd	$2,136($21)              	# [116]  id:1706 slave+0x0
	faddd	$17,$26,$17             	# [119]  
	fldd	$1,8($28)                	# [120]  id:1705 A_bs+0x0
	.loc	1	315	0
	ldi	$28,8($28)                	# [120]  
	.loc	1	311	0
	fldd	$26,144($21)             	# [121]  id:1704 slave+0x0
	.loc	1	315	0
	ldi	$21,160($21)              	# [121]  
	.loc	1	311	0
	faddd	$11,$17,$11             	# [126]  
	.loc	1	315	0
	fldd	$17,144($24)             	# [126]  id:1718 A_ds+0x0
	ldi	$24,160($24)              	# [127]  
	.loc	1	311	0
	faddd	$3,$11,$3               	# [133]  
	faddd	$2,$3,$2                	# [140]  
	.loc	1	315	0
	fldd	$3,-1136($8)             	# [140]  id:1716 slave+0x0
	.loc	1	311	0
	faddd	$1,$2,$1                	# [147]  
	.loc	1	315	0
	fldd	$2,-816($8)              	# [147]  id:1715 slave+0x0
	.loc	1	311	0
	fmuld	$1,$5,$1                	# [154]  
	fmad	$26,$4,$1,$26            	# [161]  
	.loc	1	315	0
	fldd	$1,-984($8)              	# [161]  id:1714 slave+0x0
	.loc	1	311	0
# Write-back of the source-line-311 result.
	fstd	$26,144($20)             	# [171]  id:1711 slave+0x0
	.loc	1	315	0
	ldi	$20,160($20)              	# [171]  
	fldd	$11,-2096($8)            	# [172]  id:1717 slave+0x0
	fldd	$26,-48($16)             	# [173]  id:1713 A_bs+0x0
	ldi	$16,8($16)                	# [173]  
	faddd	$11,$17,$11             	# [176]  
	fldd	$17,-976($8)             	# [176]  id:1712 slave+0x0
	ldi	$8,160($8)                	# [177]  
	faddd	$3,$11,$3               	# [183]  
# Loop-exit test; this writes integer $11.
	cmpeq	$10,$6,$11              	# [184]  
	faddd	$2,$3,$2                	# [190]  
	faddd	$1,$2,$1                	# [197]  
	faddd	$26,$1,$26              	# [204]  
	fmuld	$26,$5,$26              	# [211]  
	fmad	$17,$4,$26,$17           	# [218]  
# Write-back of the source-line-315 result.
	fstd	$17,-976($12)            	# [228]  id:1719 slave+0x0
	ldi	$12,160($12)              	# [228]  
#<bpre> branch predict taken
	beq	$11,.Lt_1_264             	# [229]  
#Block: 267 Pred: 156 Succ: 157 
.L_BB267_stencil_core:	# 0x22c4
#<freq>
#<freq> BB:267 frequency = 0.87794 (heuristic)
#<freq>
	ldl	$11,792($sp)              	# [0]  gra_spill_temp_91
	ldl	$17,800($sp)              	# [1]  gra_spill_temp_92
#Block: 157 Pred: 143 267 315 Succ: 158 161 
.Lt_1_260:	# 0x22cc
#<freq>
#<freq> BB:157 frequency = 1.00000 (heuristic)
#<freq> BB:157 => BB:158 probability = 0.92799
#<freq> BB:157 => BB:161 probability = 0.07201
#<freq>
	ldl	$2,552($sp)               	# [0]  gra_spill_temp_61
#<bpre> branch predict not taken
	beq	$2,.Lt_1_266              	# [4]  
#Block: 158 Pred: 157 Succ: 268 
.L_BB158_stencil_core:	# 0x22d4
#<freq>
#<freq> BB:158 frequency = 0.92799 (heuristic)
#<freq>
	ldl	$6,720($sp)               	# [0]  gra_spill_temp_82
	mov	$11,$21                   	# [0]  
	ldl	$8,712($sp)               	# [1]  gra_spill_temp_81
	mov	$17,$20                   	# [1]  
	ldl	$27,704($sp)              	# [2]  gra_spill_temp_80
	subw	$14,2,$12                	# [2]  
	ldl	$9,536($sp)               	# [3]  gra_spill_temp_59
	s8addl	$6,$8,$6               	# [5]  
	ldl	$28,528($sp)              	# [6]  gra_spill_temp_58
	s8addl	$27,$8,$27             	# [6]  
	ldl	$13,584($sp)              	# [7]  gra_spill_temp_65
	mov	$31,$8                    	# [7]  
	ldl	$18,592($sp)              	# [8]  gra_spill_temp_66
	ldl	$25,336($sp)              	# [9]  gra_spill_temp_34
	ldl	$24,376($sp)              	# [10]  gra_spill_temp_39
	ldl	$23,320($sp)              	# [11]  gra_spill_temp_32
	ldl	$22,368($sp)              	# [12]  gra_spill_temp_38
	ldl	$19,328($sp)              	# [13]  gra_spill_temp_33
	ldl	$16,344($sp)              	# [14]  gra_spill_temp_35
	ldl	$10,352($sp)              	# [15]  gra_spill_temp_36
	ldl	$7,360($sp)               	# [16]  gra_spill_temp_37
#Block: 268 Pred: 158 Succ: 160 
.L_BB268_stencil_core:	# 0x2328
#<freq>
#<freq> BB:268 frequency = 0.92799 (heuristic)
#<freq>
	.loc	1	324	0
# 320    //10.2 compute left and right line of i dimensional change
# 321    for(i = 1;i < i_region; ++i)
# 322    {
# 323     //front face
# 324      slave[lhs_no][i][0][0] = alpha_d * slave[rhs_no][i][0][0] + \
	fldd	$15,1120($6)             	# [0]  
#Block: 160 Pred: 160 268 Succ: 269 160 
	.align	4
.Lt_1_270:	# 0x232c
#<loop> Loop body line 315, nesting depth: 1, estimated iterations: 5
#<freq>
#<freq> BB:160 frequency = 4.63993 (heuristic)
#<freq> BB:160 => BB:269 probability = 0.20000
#<freq> BB:160 => BB:160 probability = 0.80000
#<freq>
	fldd	$2,0($6)                 	# [0]  id:1725 slave+0x0
	mov	$15,$3                    	# [0]  
	fldd	$15,2240($6)             	# [1]  id:1726 slave+0x0
	.loc	1	337	0
# 333      slave[lhs_no][i][0][k_region] = alpha_d * slave[rhs_no][i][0][k_region] + \
# 334                       beta_d * (slave[rhs_no][i-1][0][k_region] + slave[rhs_no][i+1][0][k_region] +\
# 335                       A_ls[i][k_region] + slave[rhs_no][i][1][k_region]+\
# 336                       slave[rhs_no][i][0][k_k] + A_bs[i][0]); 
# 337      slave[lhs_no][i][j_region][k_region] = alpha_d * slave[rhs_no][i][j_region][k_region] + \
	addw	$8,1,$8                  	# [1]  
	.loc	1	324	0
	fldd	$1,160($13)              	# [2]  id:1724 A_ls+0x0
	.loc	1	337	0
	ldi	$13,160($13)              	# [2]  
	.loc	1	324	0
	fldd	$26,1280($6)             	# [3]  id:1723 slave+0x0
	faddd	$2,$15,$2               	# [5]  
	fldd	$17,56($9)               	# [6]  id:1722 A_fs+0x0
	.loc	1	337	0
	ldi	$9,56($9)                 	# [6]  
	.loc	1	324	0
	fldd	$11,1128($6)             	# [7]  id:1721 slave+0x0
	.loc	1	337	0
	ldi	$6,1120($6)               	# [7]  
	.loc	1	324	0
	faddd	$1,$2,$1                	# [12]  
	.loc	1	328	0
	fldd	$2,-160($19)             	# [12]  id:1733 slave+0x0
	.loc	1	324	0
	faddd	$26,$1,$26              	# [19]  
	faddd	$17,$26,$17             	# [26]  
	.loc	1	328	0
	fldd	$26,160($18)             	# [26]  id:1731 A_rs+0x0
	.loc	1	337	0
	ldi	$18,160($18)              	# [27]  
	.loc	1	324	0
	faddd	$11,$17,$11             	# [33]  
	.loc	1	328	0
	fldd	$17,48($25)              	# [34]  id:1730 A_fs+0x0
	.loc	1	337	0
	ldi	$25,56($25)               	# [34]  
	.loc	1	324	0
	fmuld	$11,$5,$11              	# [40]  
	fmad	$3,$4,$11,$3             	# [47]  
	.loc	1	328	0
	fldd	$11,2080($19)            	# [47]  id:1734 slave+0x0
	faddd	$2,$11,$2               	# [51]  
	fldd	$11,968($19)             	# [51]  id:1729 slave+0x0
	.loc	1	324	0
	fstd	$3,1120($27)             	# [57]  id:1727 slave+0x0
	.loc	1	337	0
	ldi	$27,1120($27)             	# [57]  
	.loc	1	328	0
	fldd	$1,800($19)              	# [58]  id:1732 slave+0x0
	.loc	1	333	0
	fldd	$3,2224($21)             	# [59]  id:1742 slave+0x0
	.loc	1	328	0
	faddd	$1,$2,$1                	# [62]  
	.loc	1	333	0
	fldd	$2,-16($21)              	# [63]  id:1741 slave+0x0
	.loc	1	328	0
	faddd	$26,$1,$26              	# [69]  
	fldd	$1,960($19)              	# [70]  id:1728 slave+0x0
	.loc	1	337	0
	ldi	$19,1120($19)             	# [70]  
	.loc	1	333	0
	faddd	$2,$3,$2                	# [73]  
	fldd	$3,56($28)               	# [73]  id:1737 A_bs+0x0
	.loc	1	337	0
	ldi	$28,56($28)               	# [74]  
	.loc	1	328	0
	faddd	$17,$26,$17             	# [76]  
	.loc	1	333	0
	fldd	$26,144($23)             	# [77]  id:1740 A_ls+0x0
	.loc	1	337	0
	ldi	$23,160($23)              	# [77]  
	.loc	1	333	0
	faddd	$26,$2,$26              	# [81]  
	.loc	1	328	0
	faddd	$11,$17,$11             	# [83]  
	fmuld	$11,$5,$11              	# [90]  
	fmad	$1,$4,$11,$1             	# [97]  
	fstd	$1,960($16)              	# [107]  id:1735 slave+0x0
	.loc	1	337	0
	ldi	$16,1120($16)             	# [107]  
	.loc	1	333	0
	fldd	$17,1264($21)            	# [108]  id:1739 slave+0x0
	fldd	$11,1096($21)            	# [109]  id:1738 slave+0x0
	faddd	$17,$26,$17             	# [112]  
	fldd	$2,1104($21)             	# [113]  id:1736 slave+0x0
	.loc	1	337	0
	ldi	$21,1120($21)             	# [113]  
	fldd	$1,-176($10)             	# [114]  id:1749 slave+0x0
	.loc	1	333	0
	faddd	$11,$17,$11             	# [119]  
	.loc	1	337	0
	fldd	$17,144($22)             	# [120]  id:1747 A_rs+0x0
	ldi	$22,160($22)              	# [120]  
	.loc	1	333	0
	faddd	$3,$11,$3               	# [126]  
	.loc	1	337	0
	fldd	$11,936($10)             	# [126]  id:1746 slave+0x0
	.loc	1	333	0
	fmuld	$3,$5,$3                	# [133]  
	fmad	$2,$4,$3,$2              	# [140]  
	.loc	1	337	0
	fldd	$3,2064($10)             	# [140]  id:1750 slave+0x0
	faddd	$1,$3,$1                	# [144]  
	fldd	$3,48($24)               	# [144]  id:1745 A_bs+0x0
	ldi	$24,56($24)               	# [145]  
	.loc	1	333	0
	fstd	$2,1104($20)             	# [150]  id:1743 slave+0x0
	.loc	1	337	0
	fldd	$26,784($10)             	# [151]  id:1748 slave+0x0
	ldi	$20,1120($20)             	# [151]  
	fldd	$2,944($10)              	# [152]  id:1744 slave+0x0
	ldi	$10,1120($10)             	# [152]  
	faddd	$26,$1,$26              	# [155]  
	cmpeq	$8,$12,$1               	# [155]  
	faddd	$17,$26,$17             	# [162]  
	faddd	$11,$17,$11             	# [169]  
	faddd	$3,$11,$3               	# [176]  
	fmuld	$3,$5,$3                	# [183]  
	fmad	$2,$4,$3,$2              	# [190]  
	fstd	$2,944($7)               	# [200]  id:1751 slave+0x0
	ldi	$7,1120($7)               	# [200]  
#<bpre> branch predict taken
	beq	$1,.Lt_1_270              	# [201]  
#Block: 269 Pred: 160 Succ: 161 
.L_BB269_stencil_core:	# 0x2468
#<freq>
#<freq> BB:269 frequency = 0.92799 (heuristic)
#<freq>
#Block: 161 Pred: 269 157 Succ: 162 172 
.Lt_1_266:	# 0x2468
#<freq>
#<freq> BB:161 frequency = 1.00000 (heuristic)
#<freq> BB:161 => BB:162 probability = 0.94030
#<freq> BB:161 => BB:172 probability = 0.05970
#<freq>
# Guard: reload the value spilled at 168($sp); when it is zero, control
# leaves through .Lt_1_273 (presumably block 172, which is not in this part
# of the file) instead of running the preheader below.
	ldl	$3,168($sp)               	# [0]  gra_spill_temp_13
#<bpre> branch predict not taken
	beq	$3,.Lt_1_273              	# [4]  
#Block: 162 Pred: 161 Succ: 164 
.L_BB162_stencil_core:	# 0x2470
#<freq>
#<freq> BB:162 frequency = 0.94030 (heuristic)
#<freq>
# Preheader for the loop headed by .Lt_1_276 (operands read as
# src, src, dest; $31 is used as the zero source):
#   $8       = $14 - 2
#   $7       = ($8 + ($8 logically shifted right by 63)) arithmetically
#              shifted right by 1, saved to 184($sp).
#              NOTE(review): looks like a signed ($14 - 2) / 2 rounded
#              toward zero -- confirm.
#   488($sp) = $14 - 4    (bound reloaded by the latch at .Lt_1_277)
#   544($sp) = 0          (counter stepped by 2 in the latch at .Lt_1_277)
#   $11 = 0, $17 = 0      (stepped by 280 and 14 in that same latch)
#   $6       = value reloaded from 568($sp), minus 2
	ldl	$6,568($sp)               	# [0]  gra_spill_temp_63
	subw	$14,2,$8                 	# [0]  
	srl	$8,63,$7                  	# [1]  
	subw	$14,4,$11                	# [1]  
	addw	$7,$8,$7                 	# [2]  
	stl	$11,488($sp)              	# [2]  gra_spill_temp_53
	sra	$7,1,$7                   	# [3]  
	mov	$31,$11                   	# [3]  
	stl	$7,184($sp)               	# [4]  gra_spill_temp_15
	subw	$6,2,$6                  	# [4]  
	stl	$31,544($sp)              	# [5]  gra_spill_temp_60
	mov	$31,$17                   	# [5]  
#Block: 164 Pred: 168 162 Succ: 165 168 
.Lt_1_276:	# 0x24a0
#<loop> Loop body line 337, nesting depth: 1, estimated iterations: 2
#<freq>
#<freq> BB:164 frequency = 1.88060 (heuristic)
#<freq> BB:164 => BB:165 probability = 0.92799
#<freq> BB:164 => BB:168 probability = 0.07201
#<freq>
	ldl	$7,632($sp)               	# [0]  gra_spill_temp_71
#<bpre> branch predict not taken
	beq	$7,.Lt_1_277              	# [4]  
#Block: 165 Pred: 164 Succ: 270 
.L_BB165_stencil_core:	# 0x24a8
#<loop> Part of loop body line 337, head labeled .Lt_1_276
#<freq>
#<freq> BB:165 frequency = 1.74517 (heuristic)
#<freq>
	ldl	$27,664($sp)              	# [0]  gra_spill_temp_75
	mov	$31,$23                   	# [0]  
	ldl	$7,720($sp)               	# [1]  gra_spill_temp_82
	addl	$27,$11,$27              	# [4]  
	ldl	$28,704($sp)              	# [5]  gra_spill_temp_80
	addl	$27,$7,$8                	# [8]  
	ldl	$21,536($sp)              	# [9]  gra_spill_temp_59
	addl	$11,$7,$7                	# [9]  
	ldl	$25,528($sp)              	# [10]  gra_spill_temp_58
	addl	$11,$28,$16              	# [12]  
	ldl	$18,712($sp)              	# [13]  gra_spill_temp_81
	addl	$27,$28,$27              	# [13]  
	s8addl	$17,$21,$21            	# [14]  
	s8addl	$17,$25,$25            	# [16]  
	s8addl	$27,$18,$27            	# [17]  
	s8addl	$7,$18,$7              	# [17]  
	s8addl	$8,$18,$8              	# [18]  
	s8addl	$16,$18,$16            	# [18]  
#Block: 270 Pred: 165 Succ: 167 
.L_BB270_stencil_core:	# 0x24f0
#<loop> Part of loop body line 337, head labeled .Lt_1_276
#<freq>
#<freq> BB:270 frequency = 1.74517 (heuristic)
#<freq>
	.loc	1	351	0
# 347         slave[lhs_no][i][j][0] = alpha_d * slave[rhs_no][i][j][0] + \
# 348                       beta_d * (slave[rhs_no][i-1][j][0] + slave[rhs_no][i+1][j][0] +\
# 349                       slave[rhs_no][i][j-1][0] + slave[rhs_no][i][j+1][0]+\
# 350                       A_fs[i][j] + slave[rhs_no][i][j][1]); 
# 351         slave[lhs_no][i][j][k_region] = alpha_d * slave[rhs_no][i][j][k_region] + \
	fldd	$22,2384($8)             	# [0]  
	fldd	$20,1104($8)             	# [1]  
	.loc	1	347	0
	fldd	$18,1280($7)             	# [2]  
	fldd	$24,2400($7)             	# [3]  
	fldd	$19,1120($7)             	# [4]  
#Block: 167 Pred: 167 270 Succ: 271 167 
	.align	4
.Lt_1_281:	# 0x2504
#<loop> Loop body line 337, nesting depth: 2, estimated iterations: 5
#<freq>
#<freq> BB:167 frequency = 8.72585 (heuristic)
#<freq> BB:167 => BB:271 probability = 0.20000
#<freq> BB:167 => BB:167 probability = 0.80000
#<freq>
	fldd	$12,160($7)              	# [0]  id:1757 slave+0x0
	mov	$18,$2                    	# [0]  
	fldd	$18,1440($7)             	# [1]  id:1755 slave+0x0
	.loc	1	351	0
	addw	$23,1,$23                	# [1]  
	.loc	1	347	0
	fldd	$10,64($21)              	# [2]  id:1754 A_fs+0x0
	faddd	$12,$24,$12             	# [4]  
	fldd	$9,1288($7)              	# [5]  id:1753 slave+0x0
	faddd	$19,$12,$12             	# [11]  
	.loc	1	351	0
	fldd	$3,144($8)               	# [12]  id:1765 slave+0x0
	.loc	1	347	0
	faddd	$18,$12,$12             	# [18]  
	.loc	1	351	0
	fldd	$1,1424($8)              	# [19]  id:1763 slave+0x0
	faddd	$3,$22,$3               	# [22]  
	fldd	$26,64($25)              	# [23]  id:1761 A_bs+0x0
	.loc	1	347	0
	faddd	$10,$12,$10             	# [25]  
	fldd	$15,2240($7)             	# [26]  id:1772 slave+0x0
	.loc	1	351	0
	faddd	$20,$3,$3               	# [29]  
	.loc	1	347	0
	fldd	$20,3520($7)             	# [30]  id:1774 slave+0x0
	faddd	$9,$10,$9               	# [32]  
	fldd	$13,120($21)             	# [33]  id:1770 A_fs+0x0
	.loc	1	351	0
	ldi	$21,8($21)                	# [33]  
	.loc	1	347	0
	fldd	$12,2408($7)             	# [34]  id:1769 slave+0x0
	.loc	1	351	0
	faddd	$1,$3,$1                	# [36]  
	fldd	$10,3504($8)             	# [37]  id:1782 slave+0x0
	.loc	1	347	0
	fmuld	$9,$5,$9                	# [39]  
	.loc	1	351	0
	fldd	$3,2224($8)              	# [40]  id:1780 slave+0x0
	.loc	1	347	0
	fmad	$2,$4,$9,$2              	# [46]  
	mov	$24,$9                    	# [47]  
	fldd	$24,2560($7)             	# [47]  id:1771 slave+0x0
	fstd	$2,1280($16)             	# [56]  id:1759 slave+0x0
	.loc	1	351	0
	fldd	$28,1256($8)             	# [57]  id:1762 slave+0x0
	fldd	$22,1264($8)             	# [58]  id:1760 slave+0x0
	faddd	$28,$1,$28              	# [61]  
	fldd	$1,120($25)              	# [62]  id:1777 A_bs+0x0
	ldi	$25,8($25)                	# [62]  
	faddd	$26,$28,$26             	# [68]  
	fmuld	$26,$5,$26              	# [75]  
	fmad	$22,$4,$26,$22           	# [82]  
	cmpeq	$23,$6,$26              	# [82]  
	fstd	$22,1264($27)            	# [92]  id:1767 slave+0x0
	.loc	1	347	0
	fldd	$19,1280($7)             	# [93]  id:1773 slave+0x0
	.loc	1	351	0
	ldi	$7,160($7)                	# [93]  
	fldd	$22,2544($8)             	# [94]  id:1779 slave+0x0
	.loc	1	347	0
	faddd	$19,$20,$20             	# [97]  
	faddd	$15,$20,$15             	# [104]  
	.loc	1	351	0
	fldd	$20,1264($8)             	# [104]  id:1781 slave+0x0
	faddd	$20,$10,$10             	# [108]  
	.loc	1	347	0
	faddd	$24,$15,$15             	# [111]  
	.loc	1	351	0
	faddd	$3,$10,$3               	# [115]  
	.loc	1	347	0
	faddd	$13,$15,$13             	# [118]  
	.loc	1	351	0
	faddd	$22,$3,$3               	# [122]  
	.loc	1	347	0
	faddd	$12,$13,$12             	# [125]  
	fmuld	$12,$5,$12              	# [132]  
	fmad	$9,$4,$12,$9             	# [139]  
	fstd	$9,2400($16)             	# [149]  id:1775 slave+0x0
	.loc	1	351	0
	ldi	$16,160($16)              	# [149]  
	fldd	$2,2376($8)              	# [150]  id:1778 slave+0x0
	fldd	$28,2384($8)             	# [151]  id:1776 slave+0x0
	ldi	$8,160($8)                	# [151]  
	faddd	$2,$3,$2                	# [154]  
	faddd	$1,$2,$1                	# [161]  
	fmuld	$1,$5,$1                	# [168]  
	fmad	$28,$4,$1,$28            	# [175]  
	fstd	$28,2384($27)            	# [185]  id:1783 slave+0x0
	ldi	$27,160($27)              	# [185]  
#<bpre> branch predict taken
	beq	$26,.Lt_1_281             	# [186]  
#Block: 271 Pred: 167 Succ: 168 
.L_BB271_stencil_core:	# 0x2608
#<loop> Part of loop body line 337, head labeled .Lt_1_276
#<freq>
#<freq> BB:271 frequency = 1.74517 (heuristic)
#<freq>
#Block: 168 Pred: 271 164 Succ: 169 164 
.Lt_1_277:	# 0x2608
#<loop> Part of loop body line 337, head labeled .Lt_1_276
#<freq>
#<freq> BB:168 frequency = 1.88060 (heuristic)
#<freq> BB:168 => BB:169 probability = 0.50000
#<freq> BB:168 => BB:164 probability = 0.50000
#<freq>
# Latch of the loop headed by .Lt_1_276:
#   - reload the counter from 544($sp), add 2, store it back;
#   - advance $17 by 14 and $11 by 280;
#   - branch back to .Lt_1_276 while counter <= the bound reloaded
#     from 488($sp); otherwise fall through.
	ldl	$16,544($sp)              	# [0]  gra_spill_temp_60
	ldi	$17,14($17)               	# [0]  
	ldl	$18,488($sp)              	# [1]  gra_spill_temp_53
	ldi	$11,280($11)              	# [1]  
	addw	$16,2,$16                	# [4]  
	stl	$16,544($sp)              	# [5]  gra_spill_temp_60
	cmple	$16,$18,$16             	# [5]  
#<bpre> branch predict unknown
	bne	$16,.Lt_1_276             	# [6]  
#Block: 169 Pred: 168 Succ: 181 170 
.L_BB169_stencil_core:	# 0x2628
#<freq>
#<freq> BB:169 frequency = 0.94030 (heuristic)
#<freq> BB:169 => BB:181 probability = 0.50000
#<freq> BB:169 => BB:170 probability = 0.50000
#<freq>
# Runs once the stepped-by-2 loop at .Lt_1_276 has exited: compare the
# counter kept in 544($sp) with $14 - 3.  When counter > $14 - 3 nothing is
# left to do and control jumps to .Lt_1_286; otherwise it falls through to
# .Lt_1_313.
	ldl	$19,544($sp)              	# [0]  gra_spill_temp_60
	subw	$14,3,$20                	# [0]  
	cmple	$19,$20,$19             	# [4]  
#<bpre> branch predict unknown
	beq	$19,.Lt_1_286             	# [5]  
#Block: 170 Pred: 169 172 Succ: 171 181 
.Lt_1_313:	# 0x2638
#<freq>
#<freq> BB:170 frequency = 0.52030 (heuristic)
#<freq> BB:170 => BB:171 probability = 0.94030
#<freq> BB:170 => BB:181 probability = 0.05970
#<freq>
# Guard: when the value spilled at 632($sp) is zero, skip straight to
# .Lt_1_286.
	ldl	$21,632($sp)              	# [0]  gra_spill_temp_71
#<bpre> branch predict not taken
	beq	$21,.Lt_1_286             	# [4]  
#Block: 171 Pred: 170 Succ: 177 
.L_BB171_stencil_core:	# 0x2640
#<freq>
#<freq> BB:171 frequency = 0.48924 (heuristic)
#<freq>
# Preheader for the loop at .Lt_1_290.  Assuming sNaddl a,b,c computes
# N*a + b and sNsubl a,b,c computes N*a - b (TODO confirm against the ISA
# manual), the registers end up as:
#   $23 = counter reloaded from 544($sp)
#   $12 = $14 - 2            (end value tested in .L_BB180_stencil_core)
#   $24 = 5 * (7 * ($23 << 2)) = 140 * $23
#   $22 = 8 * $23 - $23      = 7 * $23
#   $6  = value reloaded from 568($sp), minus 2
# The factors 140 and 7 match the per-iteration steps applied in
# .L_BB180_stencil_core.
	ldl	$23,544($sp)              	# [0]  gra_spill_temp_60
	subw	$14,2,$12                	# [0]  
	ldl	$6,568($sp)               	# [1]  gra_spill_temp_63
	sll	$23,2,$24                 	# [4]  
	s8subl	$24,$24,$24            	# [5]  
	s8subl	$23,$23,$22            	# [5]  
	s4addl	$24,$24,$24            	# [6]  
	subw	$6,2,$6                  	# [8]  
#Block: 177 Pred: 180 171 Succ: 272 
.Lt_1_290:	# 0x2660
#<loop> Loop body line 351, nesting depth: 1, estimated iterations: 1
#<freq>
#<freq> BB:177 frequency = 0.48924 (heuristic)
#<freq>
	ldl	$19,664($sp)              	# [0]  gra_spill_temp_75
	mov	$31,$18                   	# [0]  
	ldl	$16,720($sp)              	# [1]  gra_spill_temp_82
	mov	$24,$15                   	# [1]  
	ldl	$20,704($sp)              	# [2]  gra_spill_temp_80
	addl	$19,$24,$19              	# [4]  
	addl	$19,$16,$8               	# [5]  
	ldl	$21,528($sp)              	# [5]  gra_spill_temp_58
	ldl	$13,712($sp)              	# [6]  gra_spill_temp_81
	addl	$24,$16,$16              	# [6]  
	addl	$19,$20,$19              	# [8]  
	addl	$24,$20,$7               	# [8]  
	ldl	$20,536($sp)              	# [9]  gra_spill_temp_59
	s8addl	$22,$21,$21            	# [9]  
	s8addl	$7,$13,$7              	# [10]  
	s8addl	$19,$13,$19            	# [10]  
	s8addl	$16,$13,$16            	# [11]  
	s8addl	$8,$13,$8              	# [11]  
	mov	$22,$13                   	# [12]  
	s8addl	$22,$20,$20            	# [13]  
#Block: 272 Pred: 177 Succ: 276 275 
.L_BB272_stencil_core:	# 0x26b0
#<loop> Part of loop body line 351, head labeled .Lt_1_290
#<freq>
#<freq> BB:272 frequency = 0.48924 (heuristic)
#<freq> BB:272 => BB:276 probability = 0.50000
#<freq> BB:272 => BB:275 probability = 0.50000
#<freq>
	.loc	1	347	0
	fldd	$24,1280($16)            	# [0]  
	and	$6,1,$25                  	# [0]  
	mov	$24,$22                   	# [4]  
#<bpre> branch predict unknown
	beq	$25,.L_BB275_stencil_core 	# [4]  
#Block: 276 Pred: 272 Succ: 275 
.L_BB276_stencil_core:	# 0x26c0
#<loop> Part of loop body line 351, head labeled .Lt_1_290
#<loop> Unrolling remainder loop (at most 1 iteration)
#<freq>
#<freq> BB:276 frequency = 0.24462 (heuristic)
#<freq>
	fldd	$3,2400($16)             	# [0]  id:1790 slave+0x0
	fldd	$2,160($16)              	# [1]  id:1789 slave+0x0
	fldd	$1,1120($16)             	# [2]  id:1788 slave+0x0
	faddd	$2,$3,$2                	# [5]  
	fldd	$22,1440($16)            	# [6]  id:1787 slave+0x0
	faddd	$1,$2,$1                	# [12]  
	fldd	$28,64($20)              	# [13]  id:1786 A_fs+0x0
	.loc	1	351	0
	ldi	$20,8($20)                	# [13]  
	.loc	1	347	0
	fldd	$27,1288($16)            	# [14]  id:1785 slave+0x0
	.loc	1	351	0
	ldi	$16,160($16)              	# [14]  
	fldd	$25,2384($8)             	# [15]  id:1798 slave+0x0
	.loc	1	347	0
	faddd	$22,$1,$1               	# [19]  
	.loc	1	351	0
	fldd	$18,144($8)              	# [20]  id:1797 slave+0x0
	.loc	1	347	0
	faddd	$28,$1,$28              	# [26]  
	.loc	1	351	0
	fldd	$3,1104($8)              	# [27]  id:1796 slave+0x0
	faddd	$18,$25,$18             	# [30]  
	fldd	$2,1424($8)              	# [31]  id:1795 slave+0x0
	.loc	1	347	0
	faddd	$27,$28,$27             	# [33]  
	.loc	1	351	0
	fldd	$28,64($21)              	# [34]  id:1793 A_bs+0x0
	ldi	$21,8($21)                	# [34]  
	faddd	$3,$18,$3               	# [37]  
	addw	$31,1,$18                	# [37]  
	.loc	1	347	0
	fmuld	$27,$5,$27              	# [40]  
	.loc	1	351	0
	faddd	$2,$3,$2                	# [44]  
	.loc	1	347	0
	fmad	$24,$4,$27,$27           	# [47]  
	fstd	$27,1280($7)             	# [57]  id:1791 slave+0x0
	.loc	1	351	0
	ldi	$7,160($7)                	# [57]  
	fldd	$1,1256($8)              	# [58]  id:1794 slave+0x0
	fldd	$27,1264($8)             	# [59]  id:1792 slave+0x0
	ldi	$8,160($8)                	# [59]  
	faddd	$1,$2,$1                	# [62]  
	faddd	$28,$1,$28              	# [69]  
	fmuld	$28,$5,$28              	# [76]  
	fmad	$27,$4,$28,$27           	# [83]  
	fstd	$27,1264($19)            	# [93]  id:1799 slave+0x0
	ldi	$19,160($19)              	# [93]  
#Block: 275 Pred: 272 276 Succ: 278 277 
.L_BB275_stencil_core:	# 0x2750
#<loop> Part of loop body line 351, head labeled .Lt_1_290
#<freq>
#<freq> BB:275 frequency = 0.48924 (heuristic)
#<freq> BB:275 => BB:278 probability = 0.50000
#<freq> BB:275 => BB:277 probability = 0.50000
#<freq>
	sra	$6,1,$26                  	# [0]  
#<bpre> branch predict unknown
	beq	$26,.L_BB277_stencil_core 	# [1]  
#Block: 278 Pred: 275 Succ: 274 
.L_BB278_stencil_core:	# 0x2758
#<loop> Part of loop body line 351, head labeled .Lt_1_290
#<freq>
#<freq> BB:278 frequency = 0.24462 (heuristic)
#<freq>
#Block: 274 Pred: 274 278 Succ: 274 279 
.L_BB274_stencil_core:	# 0x2758
#<loop> Loop body line 351, nesting depth: 2, estimated iterations: 2
#<loop> unrolled 2 times
#<freq>
#<freq> BB:274 frequency = 0.85616 (heuristic)
#<freq> BB:274 => BB:274 probability = 0.50000
#<freq> BB:274 => BB:279 probability = 0.50000
#<freq>
	.loc	1	347	0
	fldd	$24,2400($16)            	# [0]  id:1790 slave+0x0
	.loc	1	351	0
	addw	$18,2,$18                	# [0]  
	.loc	1	347	0
	fldd	$10,160($16)             	# [1]  id:1789 slave+0x0
	fldd	$9,1120($16)             	# [2]  id:1788 slave+0x0
	faddd	$10,$24,$10             	# [5]  
	fldd	$28,1440($16)            	# [6]  id:1787 slave+0x0
	faddd	$9,$10,$9               	# [12]  
	fldd	$3,64($20)               	# [13]  id:1786 A_fs+0x0
	faddd	$28,$9,$9               	# [19]  
	fldd	$2,1288($16)             	# [20]  id:1785 slave+0x0
	faddd	$3,$9,$3                	# [26]  
	.loc	1	351	0
	fldd	$9,144($8)               	# [27]  id:1797 slave+0x0
	.loc	1	347	0
	faddd	$2,$3,$2                	# [33]  
	.loc	1	351	0
	fldd	$10,2384($8)             	# [34]  id:1798 slave+0x0
	.loc	1	347	0
	fmuld	$2,$5,$2                	# [40]  
	.loc	1	351	0
	fldd	$3,1104($8)              	# [41]  id:1796 slave+0x0
	faddd	$9,$10,$9               	# [44]  
	fldd	$1,1424($8)              	# [45]  id:1795 slave+0x0
	.loc	1	347	0
	fmad	$22,$4,$2,$2             	# [47]  
	.loc	1	351	0
	fldd	$25,64($21)              	# [48]  id:1793 A_bs+0x0
	faddd	$3,$9,$3                	# [51]  
	.loc	1	347	0
	fldd	$22,320($16)             	# [52]  id:1789 slave+0x0
	.loc	1	351	0
	faddd	$1,$3,$1                	# [58]  
	.loc	1	347	0
	fstd	$2,1280($7)              	# [59]  id:1791 slave+0x0
	.loc	1	351	0
	fldd	$27,1256($8)             	# [60]  id:1794 slave+0x0
	fldd	$24,1264($8)             	# [61]  id:1792 slave+0x0
	faddd	$27,$1,$27              	# [65]  
	.loc	1	347	0
	fldd	$9,72($20)               	# [66]  id:1786 A_fs+0x0
	.loc	1	351	0
	ldi	$20,16($20)               	# [66]  
	.loc	1	347	0
	fldd	$3,1448($16)             	# [67]  id:1785 slave+0x0
	.loc	1	351	0
	faddd	$25,$27,$25             	# [72]  
	fldd	$2,304($8)               	# [73]  id:1797 slave+0x0
	fmuld	$25,$5,$25              	# [79]  
	fldd	$27,1584($8)             	# [80]  id:1795 slave+0x0
	fmad	$24,$4,$25,$24           	# [86]  
	.loc	1	347	0
	fldd	$25,2560($16)            	# [87]  id:1790 slave+0x0
	faddd	$22,$25,$22             	# [91]  
	.loc	1	351	0
	fstd	$24,1264($19)            	# [96]  id:1799 slave+0x0
	.loc	1	347	0
	fldd	$10,1280($16)            	# [97]  id:1788 slave+0x0
	.loc	1	351	0
	fldd	$1,1264($8)              	# [98]  id:1796 slave+0x0
	.loc	1	347	0
	faddd	$10,$22,$10             	# [101]  
	fldd	$22,1600($16)            	# [102]  id:1787 slave+0x0
	.loc	1	351	0
	ldi	$16,320($16)              	# [102]  
	fldd	$24,72($21)              	# [103]  id:1793 A_bs+0x0
	ldi	$21,16($21)               	# [103]  
	.loc	1	347	0
	faddd	$22,$10,$10             	# [108]  
	faddd	$9,$10,$9               	# [115]  
	faddd	$3,$9,$3                	# [122]  
	.loc	1	351	0
	fldd	$9,2544($8)              	# [122]  id:1798 slave+0x0
	faddd	$2,$9,$2                	# [126]  
	cmpeq	$18,$6,$9               	# [126]  
	.loc	1	347	0
	fmuld	$3,$5,$3                	# [129]  
	.loc	1	351	0
	faddd	$1,$2,$1                	# [133]  
	.loc	1	347	0
	fmad	$28,$4,$3,$28            	# [136]  
	.loc	1	351	0
	faddd	$27,$1,$27              	# [140]  
	.loc	1	347	0
	fstd	$28,1440($7)             	# [146]  id:1791 slave+0x0
	.loc	1	351	0
	fldd	$25,1416($8)             	# [147]  id:1794 slave+0x0
	ldi	$7,320($7)                	# [147]  
	fldd	$10,1424($8)             	# [148]  id:1792 slave+0x0
	ldi	$8,320($8)                	# [148]  
	faddd	$25,$27,$25             	# [151]  
	faddd	$24,$25,$24             	# [158]  
	fmuld	$24,$5,$24              	# [165]  
	fmad	$10,$4,$24,$10           	# [172]  
	fstd	$10,1424($19)            	# [182]  id:1799 slave+0x0
	ldi	$19,320($19)              	# [182]  
#<bpre> branch predict unknown
	beq	$9,.L_BB274_stencil_core  	# [183]  
#Block: 279 Pred: 274 Succ: 277 
.L_BB279_stencil_core:	# 0x2864
#<loop> Part of loop body line 351, head labeled .Lt_1_290
#<freq>
#<freq> BB:279 frequency = 0.42808 (heuristic)
#<freq>
#Block: 277 Pred: 275 279 Succ: 273 
.L_BB277_stencil_core:	# 0x2864
#<loop> Part of loop body line 351, head labeled .Lt_1_290
#<freq>
#<freq> BB:277 frequency = 0.00000 (heuristic)
#<freq>
#Block: 273 Pred: 277 Succ: 180 
.L_BB273_stencil_core:	# 0x2864
#<loop> Part of loop body line 351, head labeled .Lt_1_290
#<freq>
#<freq> BB:273 frequency = 0.48924 (heuristic)
#<freq>
#Block: 180 Pred: 273 Succ: 181 177 
.L_BB180_stencil_core:	# 0x2864
#<loop> Part of loop body line 351, head labeled .Lt_1_290
#<freq>
#<freq> BB:180 frequency = 0.48924 (heuristic)
#<freq> BB:180 => BB:181 probability = 1.00000
#<freq> BB:180 => BB:177 probability = 0.00000
#<freq>
# Latch of the loop headed by .Lt_1_290:
#   - $23 is incremented by 1;
#   - $24 = $15 + 140 and $22 = $13 + 7, where $15 and $13 are the copies of
#     $24 and $22 taken at the top of the loop body (block 177);
#   - the loop repeats unless $23 == $12.
# NOTE(review): the branch target is spelled .Lt_1_290.bpre, while the loop
# head visible in this file is .Lt_1_290.  The .bpre label is not defined in
# this part of the file -- confirm it exists elsewhere and leads back to
# .Lt_1_290.
	addw	$23,1,$23                	# [0]  
	ldi	$24,140($15)              	# [0]  
	cmpeq	$23,$12,$25             	# [1]  
	ldi	$22,7($13)                	# [1]  
#<bpre> branch predict not taken
	beq	$25,.Lt_1_290.bpre        	# [2]  
#Block: 181 Pred: 170 180 169 318 Succ: 182 
.Lt_1_286:	# 0x2878
.Lt_1_284:	# 0x2878
#<freq>
#<freq> BB:181 frequency = 1.00000 (heuristic)
#<freq>
# Profiling timestamp (source line 357): call rtc_ through its local entry
# point $ng..rtc_, which sits after the two $gp set-up instructions at the
# top of rtc_.  The result comes back in $0.
	.loc	1	357	0
# 353                       slave[rhs_no][i][j-1][k_region] + slave[rhs_no][i][j+1][k_region]+\
# 354                       slave[rhs_no][i][j][k_k] + A_bs[i][j]);  
# 355      }
# 356  #ifdef _PROFILING
# 357    comp_et=rtc_();
	bsr	$26,$ng..rtc_             	# [0]  rtc_
#Block: 182 Pred: 181 Succ: 183 
.L_BB182_stencil_core:	# 0x287c
#<freq>
#<freq> BB:182 frequency = 1.00000 (heuristic)
#<freq>
# Store the first timestamp into comp_et, then take a second timestamp for
# dma_st_ (source line 358).
	ldi	$15,comp_et($31)          	!tprello	# [0]  comp_et
	stl	$0,0($15)                 	# [1]  id:1800 comp_et+0x0
	.loc	1	358	0
# 358    dma_st_=rtc_();
	bsr	$26,$ng..rtc_             	# [2]  rtc_
#Block: 183 Pred: 182 Succ: 184 188 
.L_BB183_stencil_core:	# 0x2888
#<freq>
#<freq> BB:183 frequency = 1.00000 (heuristic)
#<freq> BB:183 => BB:184 probability = 0.78423
#<freq> BB:183 => BB:188 probability = 0.21577
#<freq>
# This block:
#   - stores the second timestamp into dma_st_;
#   - loads the address of put_reply into $13 and stores zero through it
#     (source line 361); $13 is used as the put_reply pointer by the
#     write-back and polling code that follows;
#   - spills the address of dma_st_ ($28) to 224($sp);
#   - skips the write-back loop (jump to .Lt_1_296) when the value reloaded
#     from 448($sp) is zero.
	.loc	1	361	0
# 359  #endif
# 360    //12 write back
# 361     put_reply=0;
	ldl	$27,448($sp)              	# [0]  gra_spill_temp_48
	.loc	1	358	0
	ldi	$28,dma_st_($31)          	!tprello	# [0]  dma_st_
	stl	$0,0($28)                 	# [1]  id:1801 dma_st_+0x0
	ldi	$13,put_reply($31)        	!tprello	# [1]  put_reply
	.loc	1	361	0
	stl	$31,0($13)                	# [2]  id:1802 put_reply+0x0
	.loc	1	358	0
	stl	$28,224($sp)              	# [3]  gra_spill_temp_20
	.loc	1	361	0
#<bpre> branch predict not taken
	beq	$27,.Lt_1_296             	# [4]  
#Block: 184 Pred: 183 Succ: 280 
.L_BB184_stencil_core:	# 0x28a4
#<freq>
#<freq> BB:184 frequency = 0.78423 (heuristic)
#<freq>
# Preheader for the write-back loop at .Lt_1_300:
#   $9  = per-iteration step added to $10 in the latch.  It is built as
#         29680 followed by "ldih $9,1($9)"; assuming ldih adds its
#         immediate shifted left by 16 (TODO confirm), that is 95216.
#   $10 = address of A (loaded via the !literal relocation)
#         + the three values reloaded from 216, 304 and 312($sp) + 8
#   $11 = value reloaded from 208($sp); stepped by 1120 in the latch
#   $12 = 0 (iteration counter)
	ldl	$16,312($sp)              	# [0]  gra_spill_temp_31
	ldi	$9,29680($31)             	# [0]  
	ldl	$12,304($sp)              	# [1]  gra_spill_temp_30
	ldih	$9,1($9)                 	# [1]  
	ldl	$11,216($sp)              	# [2]  gra_spill_temp_19
	addl	$12,$16,$12              	# [5]  
	ldl	$10,A($gp)                	!literal	# [6]  A
	addl	$11,$12,$11              	# [9]  
	mov	$31,$12                   	# [10]  
	addl	$10,$11,$10              	# [13]  
	ldl	$11,208($sp)              	# [14]  gra_spill_temp_18
	ldi	$10,8($10)                	# [14]  
#Block: 280 Pred: 184 Succ: 186 
.L_BB280_stencil_core:	# 0x28d4
#<freq>
#<freq> BB:280 frequency = 0.78423 (heuristic)
#<freq>
#Block: 186 Pred: 187 280 Succ: 187 
	.align	4
.Lt_1_300:	# 0x28d4
#<loop> Loop body line 361, nesting depth: 1, estimated iterations: 100
#<freq>
#<freq> BB:186 frequency = 78.42323 (heuristic)
#<freq>
	.loc	1	368	0
# 364     len = bsize*BLKY;
# 365     for(i =  s_starti; i < s_endi; ++i)
# 366       athread_put(PE_MODE,&slave[lhs_no][i-s_starti][0][0]
# 367                       , &A[dest][i][s_startj][s_startk]
# 368                       ,len,&put_reply,stride,bsize);
# One athread_put call per iteration.  Values set up for the call:
#   $16 = 0, $17 = $11, $18 = $10, $19 = 1120, $20 = $13, $21 = 16,
#   0($sp) = 160
# NOTE(review): matched positionally against the C call echoed above, these
# would be PE_MODE, the slave row pointer, the A destination pointer, len,
# the put_reply address, stride and bsize.  That mapping assumes the first
# six integer arguments go in $16..$21 and the seventh on the stack --
# confirm against the ABI.
	mov	160,$17                   	# [0]  
	mov	16,$21                    	# [0]  
	stl	$17,0($sp)                	# [1]  id:1825
	mov	$13,$20                   	# [1]  
	ldi	$19,1120($31)             	# [2]  
	mov	$10,$18                   	# [2]  
	mov	$11,$17                   	# [3]  
	mov	$31,$16                   	# [3]  
	.globl	athread_put
	bsr	$26,athread_put           	# [4]  athread_put
#Block: 187 Pred: 186 Succ: 281 186 
.L_BB187_stencil_core:	# 0x28f8
#<loop> Part of loop body line 361, head labeled .Lt_1_300
#<freq>
#<freq> BB:187 frequency = 78.42323 (heuristic)
#<freq> BB:187 => BB:281 probability = 0.01000
#<freq> BB:187 => BB:186 probability = 0.99000
#<freq>
# Latch: counter $12 += 1, source pointer $11 += 1120, destination pointer
# $10 += $9; repeat until $12 == $14.  $9..$14 are read here after the call
# without being reloaded, so the code relies on athread_put preserving them.
	addw	$12,1,$12                	# [4]  
	ldi	$11,1120($11)             	# [4]  
	cmpeq	$12,$14,$18             	# [5]  
	addl	$10,$9,$10               	# [5]  
#<bpre> branch predict taken
	beq	$18,.Lt_1_300             	# [6]  
#Block: 281 Pred: 187 Succ: 188 
.L_BB281_stencil_core:	# 0x290c
#<freq>
#<freq> BB:281 frequency = 0.78423 (heuristic)
#<freq>
#Block: 188 Pred: 281 183 Succ: 282 190 
.Lt_1_296:	# 0x290c
#<freq>
#<freq> BB:188 frequency = 1.00000 (heuristic)
#<freq> BB:188 => BB:282 probability = 0.94030
#<freq> BB:188 => BB:190 probability = 0.05970
#<freq>
# Wait for the write-back to complete: this is the compiled form of source
# line 369, "while(put_reply!=(BLKX));", with the comparison done against
# the constant 7.  put_reply is read through $13 on every test.
# The first test is peeled here; $14 is also reloaded from its spill slot
# at 784($sp).
	ldl	$19,0($13)                	# [0]  id:1802 put_reply+0x0
	ldl	$14,784($sp)              	# [1]  gra_spill_temp_90
	cmpeq	$19,7,$19               	# [4]  
#<bpre> branch predict not taken
	bne	$19,.Lt_1_302             	# [5]  
#Block: 282 Pred: 188 Succ: 284 
.L_BB282_stencil_core:	# 0x291c
#<freq>
#<freq> BB:282 frequency = 0.94030 (heuristic)
#<freq>
#Block: 284 Pred: 189 282 Succ: 283 285 
.L_BB284_stencil_core:	# 0x291c
#<loop> Loop body line 368
#<loop> unrolled 3 times
#<freq>
#<freq> BB:284 frequency = 3.27861 (heuristic)
#<freq> BB:284 => BB:283 probability = 0.12000
#<freq> BB:284 => BB:285 probability = 0.88000
#<freq>
# Polling loop body, unrolled three times: each copy reloads put_reply and
# leaves the loop as soon as it reads 7.
	ldl	$20,0($13)                	# [0]  id:1802 put_reply+0x0
	cmpeq	$20,7,$20               	# [4]  
#<bpre> branch predict not taken
	bne	$20,.L_BB283_stencil_core 	# [5]  
#Block: 285 Pred: 284 Succ: 283 189 
.L_BB285_stencil_core:	# 0x2928
#<loop> Part of loop body line 368, head labeled .L_BB284_stencil_core
#<loop> unrolled 3 times
#<freq>
#<freq> BB:285 frequency = 2.88517 (heuristic)
#<freq> BB:285 => BB:283 probability = 0.12000
#<freq> BB:285 => BB:189 probability = 0.88000
#<freq>
	ldl	$21,0($13)                	# [5]  id:1802 put_reply+0x0
	cmpeq	$21,7,$21               	# [9]  
#<bpre> branch predict not taken
	bne	$21,.L_BB283_stencil_core 	# [10]  
#Block: 189 Pred: 285 Succ: 283 284 
.Lt_1_304:	# 0x2934
#<loop> Part of loop body line 368, head labeled .L_BB284_stencil_core
#<freq>
#<freq> BB:189 frequency = 2.53895 (heuristic)
#<freq> BB:189 => BB:283 probability = 0.12000
#<freq> BB:189 => BB:284 probability = 0.88000
#<freq>
# Third copy: branch back to the loop head while put_reply is still not 7,
# otherwise fall through to the exit.
	ldl	$22,0($13)                	# [10]  id:1802 put_reply+0x0
	cmpeq	$22,7,$22               	# [14]  
#<bpre> branch predict taken
	beq	$22,.L_BB284_stencil_core 	# [15]  
#Block: 283 Pred: 189 284 285 Succ: 190 
.L_BB283_stencil_core:	# 0x2940
#<freq>
#<freq> BB:283 frequency = 0.94030 (heuristic)
#<freq>
#Block: 190 Pred: 283 188 Succ: 191 
.Lt_1_302:	# 0x2940
#<freq>
#<freq> BB:190 frequency = 1.00000 (heuristic)
#<freq>
	ldl	$13,760($sp)              	# [0]  gra_spill_temp_87
	ldl	$12,224($sp)              	# [1]  gra_spill_temp_20
	ldl	$9,768($sp)               	# [2]  gra_spill_temp_88
	ldl	$11,776($sp)              	# [3]  gra_spill_temp_89
	.loc	1	371	0
# 369     while(put_reply!=(BLKX)); 
# 370  #ifdef _PROFILING
# 371    dma_et_=rtc_();
	bsr	$26,$ng..rtc_             	# [4]  rtc_
#Block: 191 Pred: 190 Succ: 192 
.L_BB191_stencil_core:	# 0x2954
#<freq>
#<freq> BB:191 frequency = 1.00000 (heuristic)
#<freq>
	ldi	$10,dma_et_($31)          	!tprello	# [10]  dma_et_
	stl	$0,0($10)                 	# [11]  id:1803 dma_et_+0x0
	.loc	1	372	0
# 372    end=rtc_();
	bsr	$26,$ng..rtc_             	# [12]  rtc_
#Block: 192 Pred: 191 Succ: 
.L_BB192_stencil_core:	# 0x2960
#<freq>
#<freq> BB:192 frequency = 1.00000 (heuristic)
#<freq>
	ldi	$27,end($31)              	!tprello	# [0]  end
	.loc	1	373	0
# 373    slave_dma_count[core_id]+=((dma_et_-dma_st_)+(dma_et-dma_st));
	ldl	$23,240($sp)              	# [0]  gra_spill_temp_22
	.loc	1	372	0
	stl	$0,0($27)                 	# [1]  id:1804 end+0x0
	.loc	1	373	0
#	.body
#	.label_state 1
	ldl	$0,0($10)                 	# [2]  id:1803 dma_et_+0x0
	ldl	$1,0($12)                 	# [3]  id:1801 dma_st_+0x0
	ldl	$2,416($sp)               	# [4]  gra_spill_temp_44
	subl	$0,$1,$0                 	# [7]  
	ldl	$1,296($sp)               	# [8]  gra_spill_temp_29
	ldw	$23,0($23)                	# [9]  id:1363 core_id+0x0
	.globl	slave_dma_count
	ldl	$26,slave_dma_count($gp)  	!literal	# [10]  slave_dma_count
	.loc	1	374	0
# 374    slave_comp_dma_count[core_id]+=(end-start);
	.globl	slave_comp_dma_count
	ldl	$25,slave_comp_dma_count($gp)	!literal	# [11]  slave_comp_dma_count
	.loc	1	373	0
	s8addl	$23,$26,$26            	# [14]  
	ldl	$1,0($1)                  	# [15]  id:1382 dma_et+0x0
	.loc	1	374	0
	s8addl	$23,$25,$25            	# [18]  
	.loc	1	373	0
	ldl	$2,0($2)                  	# [19]  id:1377 dma_st+0x0
	ldl	$28,0($26)                	# [20]  id:1805 slave_dma_count+0x0
	subl	$1,$2,$1                 	# [23]  
	addl	$0,$1,$0                 	# [24]  
	.loc	1	374	0
	ldl	$27,0($27)                	# [24]  id:1804 end+0x0
	.loc	1	373	0
	addl	$28,$0,$28               	# [25]  
	.loc	1	375	0
# 375    slave_comp_count[core_id]+=(comp_et-comp_st);
	.globl	slave_comp_count
	ldl	$24,slave_comp_count($gp) 	!literal	# [25]  slave_comp_count
	.loc	1	373	0
	stl	$28,0($26)                	# [26]  id:1806 slave_dma_count+0x0
	.loc	1	375	0
	s8addl	$23,$24,$23            	# [29]  
	.loc	1	374	0
	ldl	$28,280($sp)              	# [30]  gra_spill_temp_27
	ldl	$26,0($25)                	# [31]  id:1807 slave_comp_dma_count+0x0
	.loc	1	375	0
	ldl	$24,0($23)                	# [32]  id:1809 slave_comp_count+0x0
	.loc	1	377	0
# 376  #endif
# 377  }
	ldl	$12,248($sp)              	# [33]  gra_spill_temp_23
	.loc	1	374	0
	ldl	$28,0($28)                	# [34]  id:1364 start+0x0
	.loc	1	377	0
	ldl	$10,232($sp)              	# [35]  gra_spill_temp_21
	.loc	1	374	0
#	.body
	subl	$27,$28,$27              	# [38]  
	addl	$26,$27,$26              	# [39]  
	stl	$26,0($25)                	# [40]  id:1808 slave_comp_dma_count+0x0
	.loc	1	375	0
	ldl	$26,160($sp)              	# [41]  gra_spill_temp_12
	ldl	$25,0($15)                	# [42]  id:1800 comp_et+0x0
	.loc	1	377	0
	ldl	$15,264($sp)              	# [43]  gra_spill_temp_25
	.loc	1	375	0
	ldl	$26,0($26)                	# [45]  id:1383 comp_st+0x0
	subl	$25,$26,$25              	# [49]  
	addl	$24,$25,$24              	# [50]  
	stl	$24,0($23)                	# [51]  id:1810 slave_comp_count+0x0
	.loc	1	377	0
	ldl	$26,16($sp)               	# [52]  return_address
	ldi	$sp,832($sp)              	# [52]  
	ret	$31,($26),1               	# [56]  
#Block: 72 Pred: 43 Succ: 73 75 
.Lt_1_147:	# 0x2a08
#<freq>
#<freq> BB:72 frequency = 0.25000 (heuristic)
#<freq> BB:72 => BB:73 probability = 0.50000
#<freq> BB:72 => BB:75 probability = 0.50000
#<freq>
	.loc	1	183	0
	mov	3,$24                     	# [0]  
#	.restore $sp
	stl	$8,160($sp)               	# [0]  gra_spill_temp_12
	cmple	$24,$14,$24             	# [1]  
#	.body
#	.copy_state 1
#	.spillsp $9, 0
#	.spillsp $11, 0
#	.spillsp $13, 0
#	.spillsp $14, 0
	stl	$16,168($sp)              	# [1]  gra_spill_temp_13
	stl	$24,552($sp)              	# [2]  gra_spill_temp_61
	stl	$31,512($sp)              	# [3]  gra_spill_temp_56
#<bpre> branch predict unknown
	beq	$24,.Lt_1_322             	# [4]  
#Block: 73 Pred: 72 Succ: 71 
.L_BB73_stencil_core:	# 0x2a24
#<freq>
#<freq> BB:73 frequency = 0.12500 (heuristic)
#<freq>
	ldl	$16,272($sp)              	# [0]  gra_spill_temp_26
	sll	$13,2,$17                 	# [0]  
	ldl	$19,464($sp)              	# [1]  gra_spill_temp_50
	s8subl	$17,$17,$17            	# [1]  
	ldl	$7,664($sp)               	# [2]  gra_spill_temp_75
	ldi	$12,27892($31)            	# [2]  
	ldi	$8,-27263($31)            	# [3]  
	ldih	$12,16310($12)           	# [3]  
	sll	$16,2,$16                 	# [4]  
	ldih	$8,16308($8)             	# [4]  
	s8subl	$16,$16,$16            	# [5]  
	s8subl	$17,$17,$17            	# [5]  
	s8subl	$16,$16,$16            	# [6]  
	subw	$10,$19,$19              	# [6]  
	mov	4,$18                     	# [7]  
	mov	4,$22                     	# [7]  
	mov	3,$21                     	# [8]  
	ldi	$4,11639($31)             	# [8]  
	ldi	$5,-8913($31)             	# [9]  
	ldih	$4,7969($4)              	# [9]  
	ldih	$5,1573($5)              	# [10]  
	cmple	$21,$19,$21             	# [10]  
	cmple	$22,$19,$22             	# [11]  
	cmple	$18,$7,$18              	# [11]  
	stl	$19,568($sp)              	# [12]  gra_spill_temp_63
	subw	$19,2,$6                 	# [12]  
	subw	$19,4,$20                	# [13]  
	subw	$19,3,$19                	# [13]  
	s4addl	$16,$16,$16            	# [14]  
	s4addl	$17,$17,$17            	# [14]  
	sll	$8,32,$8                  	# [15]  
	sll	$12,32,$12                	# [15]  
	addl	$4,$12,$4                	# [16]  
	subw	$14,2,$12                	# [16]  
	addl	$5,$8,$5                 	# [17]  
	stl	$17,720($sp)              	# [17]  gra_spill_temp_82
	stl	$16,704($sp)              	# [18]  gra_spill_temp_80
	subw	$7,3,$7                  	# [18]  
	stl	$19,432($sp)              	# [19]  gra_spill_temp_46
	stl	$20,472($sp)              	# [20]  gra_spill_temp_51
	stl	$18,576($sp)              	# [21]  gra_spill_temp_64
	stl	$22,440($sp)              	# [22]  gra_spill_temp_47
	stl	$21,632($sp)              	# [23]  gra_spill_temp_71
	br	$31,.Lt_1_307              	# [24]  
#Block: 121 Pred: 110 Succ: 119 316 
.Lt_1_213:	# 0x2ad4
#<freq>
#<freq> BB:121 frequency = 0.25000 (heuristic)
#<freq> BB:121 => BB:119 probability = 0.84000
#<freq> BB:121 => BB:316 probability = 0.16000
#<freq>
	.loc	1	218	0
	ldl	$17,576($sp)              	# [0]  gra_spill_temp_64
	stl	$31,672($sp)              	# [1]  gra_spill_temp_76
#<bpre> branch predict taken
	bne	$17,.Lt_1_310             	# [4]  
#Block: 316 Pred: 121 Succ: 130 
.L_BB316_stencil_core:	# 0x2ae0
#<freq>
#<freq> BB:316 frequency = 0.04000 (heuristic)
#<freq>
	br	$31,.Lt_1_226              	# [0]  
#Block: 30 Pred: 23 Succ: 31 
.Lt_1_129:	# 0x2ae4
#<freq>
#<freq> BB:30 frequency = 0.21577 (heuristic)
#<freq>
	.loc	1	139	0
	ldl	$18,664($sp)              	# [0]  gra_spill_temp_75
	ldi	$19,A_fs($31)             	!tprello	# [0]  A_fs
	ldi	$20,A_bs($31)             	!tprello	# [1]  A_bs
	stl	$19,536($sp)              	# [1]  gra_spill_temp_59
	stl	$20,528($sp)              	# [2]  gra_spill_temp_58
	s8addl	$18,$31,$18            	# [4]  
	stl	$18,144($sp)              	# [5]  gra_spill_temp_10
	stl	$5,752($sp)               	# [6]  gra_spill_temp_86
	br	$31,.Lt_1_128              	# [7]  
#Block: 14 Pred: 13 Succ: 15 20 
.L_BB14_stencil_core:	# 0x2b08
#<freq>
#<freq> BB:14 frequency = 0.15184 (heuristic)
#<freq> BB:14 => BB:15 probability = 0.40909
#<freq> BB:14 => BB:20 probability = 0.59091
#<freq>
	.loc	1	113	0
	ldl	$16,520($sp)              	# [0]  gra_spill_temp_57
	ldl	$14,256($sp)              	# [1]  gra_spill_temp_24
	ldl	$21,448($sp)              	# [2]  gra_spill_temp_48
#	.restorereg $15
	subw	$14,$16,$14              	# [5]  
#<bpre> branch predict taken
	br .L_BB14_stencil_core.bpre1
.Lt_1_123.bpre.L_BB14_stencil_core:
	br .Lt_1_123
.L_BB14_stencil_core.bpre1:
	beq	$21,.Lt_1_123.bpre.L_BB14_stencil_core 	# [9]  
#Block: 15 Pred: 14 Succ: 200 
.L_BB15_stencil_core:	# 0x2b1c
#<freq>
#<freq> BB:15 frequency = 0.06212 (heuristic)
#<freq>
	ldl	$20,520($sp)              	# [0]  gra_spill_temp_57
	sll	$13,5,$10                 	# [0]  
	ldl	$16,464($sp)              	# [1]  gra_spill_temp_50
	s8subl	$10,$10,$10            	# [1]  
	ldl	$17,456($sp)              	# [2]  gra_spill_temp_49
	s8subl	$10,$10,$10            	# [2]  
	ldl	$11,A($gp)                	!literal	# [3]  A
	s4addl	$10,$10,$10            	# [3]  
	sll	$20,4,$21                 	# [4]  
	sll	$20,8,$20                 	# [4]  
	s4addl	$21,$21,$19            	# [5]  
	s4subl	$21,$21,$22            	# [5]  
	s4addl	$19,$22,$19            	# [6]  
	subl	$31,$21,$21              	# [6]  
	s4addl	$20,$21,$20            	# [7]  
	sll	$19,8,$19                 	# [7]  
	sll	$16,4,$16                 	# [8]  
	addl	$19,$20,$19              	# [8]  
	s8subl	$16,$16,$18            	# [9]  
	addl	$17,$19,$17              	# [9]  
	s4addl	$16,$18,$16            	# [10]  
	stl	$13,112($sp)              	# [10]  gra_spill_temp_6
	ldi	$13,slave($31)            	!tprello	# [11]  slave
	stl	$16,216($sp)              	# [11]  gra_spill_temp_19
	stl	$13,712($sp)              	# [12]  gra_spill_temp_81
	addl	$10,$13,$10              	# [12]  
	ldi	$13,568($31)              	# [13]  
	addl	$16,$17,$16              	# [13]  
	addl	$11,$16,$11              	# [14]  
	ldih	$13,786($13)             	# [14]  
	ldi	$9,29680($31)             	# [15]  
	addl	$11,$13,$11              	# [15]  
	ldih	$9,1($9)                 	# [16]  
	mov	$31,$13                   	# [16]  
	stl	$10,424($sp)              	# [17]  gra_spill_temp_45
#Block: 200 Pred: 15 Succ: 17 
.L_BB200_stencil_core:	# 0x2ba8
#<freq>
#<freq> BB:200 frequency = 0.06212 (heuristic)
#<freq>
#Block: 17 Pred: 18 200 Succ: 18 
	.align	4
.Lt_1_126:	# 0x2ba8
#<loop> Loop body line 113, nesting depth: 1, estimated iterations: 100
#<freq>
#<freq> BB:17 frequency = 6.21174 (heuristic)
#<freq>
	.loc	1	122	0
	mov	160,$22                   	# [0]  
	mov	16,$23                    	# [0]  
	stl	$23,0($sp)                	# [1]  id:1811
	mov	$31,$21                   	# [1]  
	stl	$22,8($sp)                	# [2]  id:1812
	mov	$12,$20                   	# [2]  
	ldi	$19,1120($31)             	# [3]  
	mov	$10,$18                   	# [3]  
	mov	$11,$17                   	# [4]  
	mov	$31,$16                   	# [4]  
	.globl	athread_get
	bsr	$26,athread_get           	# [5]  athread_get
#Block: 18 Pred: 17 Succ: 17 201 
.L_BB18_stencil_core:	# 0x2bd4
#<loop> Part of loop body line 113, head labeled .Lt_1_126
#<freq>
#<freq> BB:18 frequency = 6.21174 (heuristic)
#<freq> BB:18 => BB:17 probability = 0.99000
#<freq> BB:18 => BB:201 probability = 0.01000
#<freq>
	addw	$13,1,$13                	# [5]  
	addl	$11,$9,$11               	# [5]  
	cmpeq	$13,$14,$24             	# [6]  
	ldi	$10,1120($10)             	# [6]  
#<bpre> branch predict taken
	beq	$24,.Lt_1_126             	# [7]  
#Block: 201 Pred: 18 Succ: 193 
.L_BB201_stencil_core:	# 0x2be8
#<freq>
#<freq> BB:201 frequency = 0.06212 (heuristic)
#<freq>
#Block: 193 Pred: 201 Succ: 23 
.L_BB193_stencil_core:	# 0x2be8
#<freq>
#<freq> BB:193 frequency = 0.06212 (heuristic)
#<freq>
	ldl	$11,A($gp)                	!literal	# [0]  A
	.loc	1	123	0
	mov	$14,$5                    	# [0]  
	ldl	$13,112($sp)              	# [1]  gra_spill_temp_6
	stl	$15,264($sp)              	# [2]  gra_spill_temp_25
	br	$31,.Lt_1_120              	# [3]  
#Block: 20 Pred: 14 Succ: 23 
.Lt_1_123:	# 0x2bfc
#<freq>
#<freq> BB:20 frequency = 0.08973 (heuristic)
#<freq>
	.loc	1	122	0
	ldl	$28,464($sp)              	# [0]  gra_spill_temp_50
#	.spillsp $15, 0
	sll	$13,5,$27                 	# [0]  
	s8subl	$27,$27,$27            	# [1]  
#	.restorereg $15
	ldi	$25,slave($31)            	!tprello	# [1]  slave
	s8subl	$27,$27,$27            	# [2]  
	stl	$25,712($sp)              	# [2]  gra_spill_temp_81
	s4addl	$27,$27,$27            	# [3]  
	ldl	$11,A($gp)                	!literal	# [3]  A
	sll	$28,4,$28                 	# [4]  
	addl	$25,$27,$25              	# [4]  
	s8subl	$28,$28,$1             	# [5]  
	stl	$25,424($sp)              	# [5]  gra_spill_temp_45
	s4addl	$28,$1,$28             	# [6]  
	stl	$15,264($sp)              	# [6]  gra_spill_temp_25
	stl	$28,216($sp)              	# [7]  gra_spill_temp_19
	.loc	1	123	0
	mov	$14,$5                    	# [7]  
#	.spillsp $15, 0
	br	$31,.Lt_1_120              	# [8]  
#Block: 75 Pred: 72 Succ: 76 
.Lt_1_322:	# 0x2c40
#<freq>
#<freq> BB:75 frequency = 0.12500 (heuristic)
#<freq>
	.loc	1	183	0
	ldl	$8,272($sp)               	# [0]  gra_spill_temp_26
	sll	$13,2,$16                 	# [0]  
	ldl	$18,464($sp)              	# [1]  gra_spill_temp_50
	s8subl	$16,$16,$16            	# [1]  
	ldl	$20,664($sp)              	# [2]  gra_spill_temp_75
	ldi	$7,27892($31)             	# [2]  
	ldi	$6,-27263($31)            	# [3]  
	ldih	$7,16310($7)             	# [3]  
	sll	$8,2,$8                   	# [4]  
	ldih	$6,16308($6)             	# [4]  
	s8subl	$8,$8,$8               	# [5]  
	s8subl	$16,$16,$16            	# [5]  
	s8subl	$8,$8,$8               	# [6]  
	subw	$10,$18,$18              	# [6]  
	mov	4,$19                     	# [7]  
	mov	3,$17                     	# [7]  
	ldi	$4,11639($31)             	# [8]  
	ldi	$5,-8913($31)             	# [8]  
	ldih	$5,1573($5)              	# [9]  
	ldih	$4,7969($4)              	# [9]  
	cmple	$17,$18,$17             	# [10]  
	cmple	$19,$20,$19             	# [10]  
	s4addl	$8,$8,$8               	# [11]  
	s4addl	$16,$16,$16            	# [11]  
	sll	$6,32,$6                  	# [12]  
	sll	$7,32,$7                  	# [12]  
	addl	$4,$7,$4                 	# [13]  
	addl	$5,$6,$5                 	# [13]  
	stl	$16,720($sp)              	# [14]  gra_spill_temp_82
	stl	$8,704($sp)               	# [15]  gra_spill_temp_80
	stl	$19,576($sp)              	# [16]  gra_spill_temp_64
	stl	$17,632($sp)              	# [17]  gra_spill_temp_71
	stl	$18,568($sp)              	# [18]  gra_spill_temp_63
	br	$31,.Lt_1_177              	# [19]  
#Block: 57 Pred: 46 Succ: 58 68 
.Lt_1_152:	# 0x2cc8
#<loop> Part of loop body line 177, head labeled .Lt_1_150
#<freq>
#<freq> BB:57 frequency = 0.08955 (heuristic)
#<freq> BB:57 => BB:58 probability = 0.84000
#<freq> BB:57 => BB:68 probability = 0.16000
#<freq>
	ldl	$16,576($sp)              	# [0]  gra_spill_temp_64
	stl	$31,616($sp)              	# [1]  gra_spill_temp_69
#<bpre> branch predict not taken
	beq	$16,.Lt_1_165.bpre        	# [4]  
#Block: 58 Pred: 57 Succ: 56 317 
.L_BB58_stencil_core:	# 0x2cd4
#<loop> Part of loop body line 177, head labeled .Lt_1_150
#<freq>
#<freq> BB:58 frequency = 0.07522 (heuristic)
#<freq> BB:58 => BB:56 probability = 0.84000
#<freq> BB:58 => BB:317 probability = 0.16000
#<freq>
	ldl	$17,632($sp)              	# [0]  gra_spill_temp_71
#<bpre> branch predict taken
	bne	$17,.Lt_1_306             	# [4]  
#Block: 317 Pred: 58 Succ: 68 
.L_BB317_stencil_core:	# 0x2cdc
#<loop> Part of loop body line 177, head labeled .Lt_1_150
#<freq>
#<freq> BB:317 frequency = 0.01204 (heuristic)
#<freq>
	br	$31,.Lt_1_165              	# [0]  
#Block: 172 Pred: 161 Succ: 170 318 
.Lt_1_273:	# 0x2ce0
#<freq>
#<freq> BB:172 frequency = 0.05970 (heuristic)
#<freq> BB:172 => BB:170 probability = 0.84000
#<freq> BB:172 => BB:318 probability = 0.16000
#<freq>
	.loc	1	351	0
	ldl	$18,552($sp)              	# [0]  gra_spill_temp_61
	stl	$31,544($sp)              	# [1]  gra_spill_temp_60
#<bpre> branch predict taken
	bne	$18,.Lt_1_313             	# [4]  
#Block: 318 Pred: 172 Succ: 181 
.L_BB318_stencil_core:	# 0x2cec
#<freq>
#<freq> BB:318 frequency = 0.00955 (heuristic)
#<freq>
	br	$31,.Lt_1_286              	# [0]  
#Block: 11 Pred: 10 Succ: 12 
.L_BB11_stencil_core:	# 0x2cf0
#<freq>
#<freq> BB:11 frequency = 0.05098 (heuristic)
#<freq>
	.loc	1	113	0
	ldl	$16,.rodata($gp)          	!literal	# [0]  .rodata
	stl	$14,280($sp)              	# [1]  gra_spill_temp_27
	.globl	printf
	bsr	$26,printf                	# [2]  printf
#Block: 12 Pred: 11 Succ: 23 
.L_BB12_stencil_core:	# 0x2cfc
#<freq>
#<freq> BB:12 frequency = 0.05098 (heuristic)
#<freq>
#	.restorereg $15
	ldl	$21,464($sp)              	# [0]  gra_spill_temp_50
	sll	$13,5,$24                 	# [0]  
	ldl	$19,520($sp)              	# [1]  gra_spill_temp_57
	s8subl	$24,$24,$24            	# [1]  
	ldl	$20,256($sp)              	# [2]  gra_spill_temp_24
	s8subl	$24,$24,$24            	# [2]  
	s4addl	$24,$24,$24            	# [3]  
	ldi	$23,slave($31)            	!tprello	# [3]  slave
	sll	$21,4,$21                 	# [4]  
	stl	$23,712($sp)              	# [4]  gra_spill_temp_81
	s8subl	$21,$21,$22            	# [5]  
	addl	$23,$24,$23              	# [5]  
	s4addl	$21,$22,$21            	# [6]  
	subw	$20,$19,$14              	# [6]  
	cmplt	$19,$20,$19             	# [7]  
	ldl	$11,A($gp)                	!literal	# [7]  A
	stl	$19,448($sp)              	# [8]  gra_spill_temp_48
	mov	$31,$5                    	# [8]  
	stl	$21,216($sp)              	# [9]  gra_spill_temp_19
	stl	$23,424($sp)              	# [10]  gra_spill_temp_45
	stl	$15,264($sp)              	# [11]  gra_spill_temp_25
	br	$31,.Lt_1_120              	# [12]  
#Block: 4 Pred: 3 Succ: 5 
.L_BB4_stencil_core:	# 0x2d54
#<freq>
#<freq> BB:4 frequency = 0.04211 (heuristic)
#<freq>
	.loc	1	96	0
	mov	2,$16                     	# [18]  
#	.spillsp $15, 0
	.globl	ldm_set_datatiles
	bsr	$26,ldm_set_datatiles     	# [18]  ldm_set_datatiles
#Block: 5 Pred: 4 Succ: 6 
.L_BB5_stencil_core:	# 0x2d5c
#<freq>
#<freq> BB:5 frequency = 0.04211 (heuristic)
#<freq>
	.loc	1	97	0
	ldl	$22,64($sp)               	# [0]  gra_spill_temp_0
#	.restorereg $13
#	.restorereg $15
	mov	1,$23                     	# [0]  
	stw	$23,0($22)                	# [4]  id:1371 amt_flag+0x0
	br	$31,.Lt_1_116              	# [5]  
#Block: 92 Pred: 81 Succ: 93 103 
.Lt_1_182:	# 0x2d6c
#<loop> Part of loop body line 183, head labeled .Lt_1_180
#<freq>
#<freq> BB:92 frequency = 0.02985 (heuristic)
#<freq> BB:92 => BB:93 probability = 0.84000
#<freq> BB:92 => BB:103 probability = 0.16000
#<freq>
	.loc	1	183	0
	ldl	$24,576($sp)              	# [0]  gra_spill_temp_64
	mov	$31,$11                   	# [0]  
#<bpre> branch predict not taken
	beq	$24,.Lt_1_195.bpre        	# [4]  
#Block: 93 Pred: 92 Succ: 91 319 
.L_BB93_stencil_core:	# 0x2d78
#<loop> Part of loop body line 183, head labeled .Lt_1_180
#<freq>
#<freq> BB:93 frequency = 0.02507 (heuristic)
#<freq> BB:93 => BB:91 probability = 0.84000
#<freq> BB:93 => BB:319 probability = 0.16000
#<freq>
#	.spillsp $13, 0
#	.spillsp $15, 0
	ldl	$25,632($sp)              	# [0]  gra_spill_temp_71
#<bpre> branch predict taken
	bne	$25,.Lt_1_308             	# [4]  
#Block: 319 Pred: 93 Succ: 103 
.L_BB319_stencil_core:	# 0x2d80
#<loop> Part of loop body line 183, head labeled .Lt_1_180
#<freq>
#<freq> BB:319 frequency = 0.00401 (heuristic)
#<freq>
	br	$31,.Lt_1_195              	# [0]  
.Lt_1_169.bpre:
	br .Lt_1_169
.Lt_1_199.bpre:
	br .Lt_1_199
.Lt_1_180.bpre:
	br .Lt_1_180
.Lt_1_323.bpre:
	br .Lt_1_323
.Lt_1_290.bpre:
	br .Lt_1_290
.Lt_1_165.bpre:
	br .Lt_1_165
.Lt_1_195.bpre:
	br .Lt_1_195
.L_CC_stencil_core:
#PU cycle count: 9263.371094
	.end	stencil_core

	# Read-only constants of this compilation unit. Every object is pinned to a
	# fixed section offset with .org, so the layout below must not be reordered.
	.section .rodata
	.org 0x0
	.align	0
	# offset 0
	# NUL-terminated message "Array assignment failed\n" (25 bytes, offsets 0x00-0x18).
	# stencil_core fetches `.rodata` through a !literal reference into $16 right
	# before its `bsr printf`.
	.byte	0x41, 0x72, 0x72, 0x61, 0x79, 0x20, 0x61, 0x73	# Array as
	.byte	0x73, 0x69, 0x67, 0x6e, 0x6d, 0x65, 0x6e, 0x74	# signment
	.byte	0x20, 0x66, 0x61, 0x69, 0x6c, 0x65, 0x64, 0xa	#  failed\n
	.byte	0x0	# \000
	# Offsets 0x19-0x1f are the gap left by the .org below.
	.org 0x20
	.align	0
	# offset 32
	# 8-byte double stored least-significant byte first: bit pattern 0x3FB66CF41F212D77.
	.ascii	"\x77\x2d\x21\x1f\xf4\x6c\xb6\x3f"	# double 0.0876000
	.org 0x28
	.align	0
	# offset 40
	# 8-byte double stored least-significant byte first: bit pattern 0x3FB395810624DD2F.
	.ascii	"\x2f\xdd\x24\x06\x81\x95\xb3\x3f"	# double 0.0765000
	# Closing alignment directives: each section used by this file is re-entered
	# only to state its alignment; no labels or objects are defined here.
	# The .bss/.tdata/.tdata_local/.tdata_local_fix/.text1 values repeat the ones
	# declared at the top of the file; .rodata additionally gets `.align 3`.
	.section .bss
	.align 3
	.section .tdata
	.align 0
	.section .tdata_local
	.align 4
	.section .tdata_local_fix
	.align 4
	.section .text1
	.align 4
	.section .rodata
	.align 3
	# The directive below is emitted commented-out by the compiler and has no effect.
#	.gpvalue 0

	# DWARF version 2 debug information: one compile-unit DIE (abbrev code 1) with
	# two child subprogram DIEs (abbrev code 2), for rtc_ and stencil_core.
	# Attribute order and forms are dictated by the .debug_abbrev table in this file.
	.section .debug_info, "", "progbits"
	.align	0
	# Unit header: unit_length = 0x6e (110 bytes follow this field), version = 2.
	.byte	0x6e, 0x00, 0x00, 0x00, 0x02, 0x00
	# Unit header: offset of this unit's abbreviation table.
	.long	.debug_abbrev
	# 0x08 = address size (last header byte); 0x01 = abbrev code 1 (compile unit).
	# DW_AT_name: "3d7p_reuse_v1_unhide.c" followed by its NUL on the fourth line.
	.byte	0x08, 0x01, 0x33, 0x64, 0x37, 0x70, 0x5f, 0x72
	.byte	0x65, 0x75, 0x73, 0x65, 0x5f, 0x76, 0x31, 0x5f
	.byte	0x75, 0x6e, 0x68, 0x69, 0x64, 0x65, 0x2e, 0x63
	# NUL ending the name; DW_AT_producer = "-O3\0"; DW_AT_language = 0x01;
	# DW_AT_identifier_case = 0x00.
	.byte	0x00, 0x2d, 0x4f, 0x33, 0x00, 0x01, 0x00
	# DW_AT_stmt_list: offset of this unit's line-number program.
	.long	.debug_line
	# Subprogram DIE (abbrev code 2): decl_file = 1, decl_line = 0x36 (54),
	# DW_AT_name = "rtc_\0".
	.byte	0x02, 0x01, 0x36, 0x72, 0x74, 0x63, 0x5f, 0x00
	# DW_AT_external = 1; DW_AT_frame_base = 3-byte block: DW_OP_bregx (0x92),
	# register 30 (presumably $sp - confirm against the SW3 DWARF register map),
	# offset 16, which equals the frame size rtc_ allocates.
	.byte	0x01, 0x03, 0x92, 0x1e, 0x10
	# DW_AT_low_pc / DW_AT_high_pc of rtc_.
	.quad	.L_BB1_rtc_
	.quad	.L_CC_rtc_
	# Subprogram DIE (abbrev code 2): decl_file = 1, decl_line = 0x3e (62),
	# DW_AT_name = "stencil_core\0".
	.byte	0x02, 0x01, 0x3e, 0x73, 0x74, 0x65, 0x6e, 0x63
	.byte	0x69, 0x6c, 0x5f, 0x63, 0x6f, 0x72, 0x65, 0x00
	# DW_AT_external = 1; DW_AT_frame_base = 4-byte block: DW_OP_bregx, register 30,
	# SLEB128 offset 0xc0 0x06 = 832, which equals the frame stencil_core releases
	# with `ldi $sp,832($sp)` before returning.
	.byte	0x01, 0x04, 0x92, 0x1e, 0xc0, 0x06
	# DW_AT_low_pc / DW_AT_high_pc of stencil_core.
	.quad	.L_BB1_stencil_core
	.quad	.L_CC_stencil_core
	# First 0x00 closes the compile unit's child list; the second is an extra
	# null byte that is already counted in unit_length.
	.byte	0x00, 0x00

	# DWARF address-range table: a single range covering all code emitted by this
	# file, from the first label of rtc_ to the end-of-code label of stencil_core.
	.section .debug_aranges, "", "progbits"
	.align	0
	# unit_length = 0x2c (44 bytes follow this field), version = 2.
	.byte	0x2c, 0x00, 0x00, 0x00, 0x02, 0x00
	# Offset of the compile unit these ranges belong to.
	.long	.debug_info
	# address_size = 8, segment_size = 0, then four zero bytes padding the
	# 12-byte header to 16 bytes (twice the address size).
	.byte	0x08, 0x00, 0x00, 0x00, 0x00, 0x00
	# Range tuple: start address ...
	.quad	.L_BB1_rtc_
	# ... and length in bytes.
	.quad	.L_CC_stencil_core - .L_BB1_rtc_
	# Terminating tuple: 16 zero bytes (address = 0, length = 0).
	.byte	0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00
	.byte	0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00

	# DWARF public-names lookup table: maps the global names rtc_ and stencil_core
	# to the offsets of their DIEs inside this file's .debug_info contribution.
	.section .debug_pubnames, "", "progbits"
	.align	0
	# unit_length = 0x28 (40 bytes follow this field), version = 2.
	.byte	0x28, 0x00, 0x00, 0x00, 0x02, 0x00
	# debug_info_offset: start of the compile unit the names belong to.
	.long	.debug_info
	# debug_info_length = 0x72: full size of that compile unit, i.e. its 4-byte
	# unit_length field plus the 0x6e bytes it announces. The compiler emitted 0
	# here, which does not describe the unit. Keep this value in step with the
	# .debug_info unit_length if that section is ever changed.
	# Next four bytes: DIE offset 0x2d (45) of the first entry.
	.byte	0x72, 0x00, 0x00, 0x00, 0x2d, 0x00, 0x00, 0x00
	# "rtc_\0", then DIE offset 0x4a (74) of the second entry (first 3 bytes).
	.byte	0x72, 0x74, 0x63, 0x5f, 0x00, 0x4a, 0x00, 0x00
	# Last offset byte, then "stencil_core\0" continuing on the next line.
	.byte	0x00, 0x73, 0x74, 0x65, 0x6e, 0x63, 0x69, 0x6c
	# Rest of the name and its NUL, then the 4-byte zero offset that terminates
	# the table (completed by the two bytes on the final line).
	.byte	0x5f, 0x63, 0x6f, 0x72, 0x65, 0x00, 0x00, 0x00
	.byte	0x00, 0x00

	# DWARF abbreviation table used by the .debug_info unit in this file.
	#
	# Abbrev 1: tag 0x11 (DW_TAG_compile_unit), has children (0x01)
	#   0x03 DW_AT_name            / 0x08 DW_FORM_string
	#   0x25 DW_AT_producer        / 0x08 DW_FORM_string
	#   0x13 DW_AT_language        / 0x0b DW_FORM_data1
	#   0x42 DW_AT_identifier_case / 0x0b DW_FORM_data1
	#   0x10 DW_AT_stmt_list       / 0x06 DW_FORM_data4
	#   0x00 0x00 end of attribute list
	# Abbrev 2: tag 0x2e (DW_TAG_subprogram), no children (0x00)
	#   0x3a DW_AT_decl_file       / 0x0b DW_FORM_data1
	#   0x3b DW_AT_decl_line       / 0x0b DW_FORM_data1
	#   0x03 DW_AT_name            / 0x08 DW_FORM_string
	#   0x3f DW_AT_external        / 0x0c DW_FORM_flag
	#   0x40 DW_AT_frame_base      / 0x0a DW_FORM_block1
	#   0x11 DW_AT_low_pc          / 0x01 DW_FORM_addr
	#   0x12 DW_AT_high_pc         / 0x01 DW_FORM_addr
	#   0x00 0x00 end of attribute list
	.section .debug_abbrev, "", "progbits"
	.align	0
	.byte	0x01, 0x11, 0x01, 0x03, 0x08, 0x25, 0x08, 0x13
	.byte	0x0b, 0x42, 0x0b, 0x10, 0x06, 0x00, 0x00, 0x02
	.byte	0x2e, 0x00, 0x3a, 0x0b, 0x3b, 0x0b, 0x03, 0x08
	.byte	0x3f, 0x0c, 0x40, 0x0a, 0x11, 0x01, 0x12, 0x01
	.byte	0x00, 0x00
	# Null abbreviation code ending this unit's abbreviation set. The compiler
	# output stopped after the attribute-list terminator above, so a consumer
	# scanning for an unknown code would run into whatever is linked after it.
	.byte	0x00
	# Toolchain identification string recorded in the object file.
	.ident	"#SWCC Version 3.1.0-483 : 3d7p_reuse_v1_unhide.c compiled with : -TENV:PIC -m1 -O3 "
